From dd3ea8d31b1b5615bcdd6b671f5e6e86315e8dda Mon Sep 17 00:00:00 2001 From: liyang830 Date: Fri, 10 Mar 2023 20:52:27 +0800 Subject: [PATCH 001/985] feat: modify materalized view query, check inner table structure --- src/Storages/StorageMaterializedView.cpp | 13 +++++++++++++ ...erialized_view_query_has_inner_table.reference | 2 ++ ...er_materialized_view_query_has_inner_table.sql | 15 +++++++++++++++ 3 files changed, 30 insertions(+) create mode 100644 tests/queries/0_stateless/25340_alter_materialized_view_query_has_inner_table.reference create mode 100644 tests/queries/0_stateless/25340_alter_materialized_view_query_has_inner_table.sql diff --git a/src/Storages/StorageMaterializedView.cpp b/src/Storages/StorageMaterializedView.cpp index ae3fa62b38c..0bbd689043c 100644 --- a/src/Storages/StorageMaterializedView.cpp +++ b/src/Storages/StorageMaterializedView.cpp @@ -7,6 +7,7 @@ #include #include #include +#include #include #include #include @@ -269,6 +270,18 @@ void StorageMaterializedView::alter( DatabaseCatalog::instance().updateViewDependency(old_select.select_table_id, table_id, new_select.select_table_id, table_id); new_metadata.setSelectQuery(new_select); + + /// check materialized view inner table structure + if (has_inner_table) + { + const Block & block = InterpreterSelectWithUnionQuery::getSampleBlock(new_select.select_query, local_context); + for (const auto & col : block.getColumnsWithTypeAndName()) + { + if (!tryGetTargetTable()->getInMemoryMetadata().columns.has(col.name)) + throw Exception(ErrorCodes::QUERY_IS_NOT_SUPPORTED_IN_MATERIALIZED_VIEW, "column {} is not in materialized view inner table", col.name); + } + } + } /// end modify query diff --git a/tests/queries/0_stateless/25340_alter_materialized_view_query_has_inner_table.reference b/tests/queries/0_stateless/25340_alter_materialized_view_query_has_inner_table.reference new file mode 100644 index 00000000000..1191247b6d9 --- /dev/null +++ b/tests/queries/0_stateless/25340_alter_materialized_view_query_has_inner_table.reference @@ -0,0 +1,2 @@ +1 +2 diff --git a/tests/queries/0_stateless/25340_alter_materialized_view_query_has_inner_table.sql b/tests/queries/0_stateless/25340_alter_materialized_view_query_has_inner_table.sql new file mode 100644 index 00000000000..73bbac59a95 --- /dev/null +++ b/tests/queries/0_stateless/25340_alter_materialized_view_query_has_inner_table.sql @@ -0,0 +1,15 @@ +DROP TABLE IF EXISTS src_table; +DROP TABLE IF EXISTS mv; + +CREATE TABLE src_table (`a` UInt32, `b` UInt32) ENGINE = MergeTree ORDER BY a; +CREATE MATERIALIZED VIEW mv UUID '2bad6d75-86fe-4da0-815b-2c7410253941' (`a` UInt32) ENGINE = MergeTree ORDER BY a AS SELECT a FROM src_table; + +INSERT INTO src_table (a, b) VALUES (1, 1), (2, 2); + +SELECT * FROM mv; + +SET allow_experimental_alter_materialized_view_structure = 1; +ALTER TABLE mv MODIFY QUERY SELECT a, b FROM src_table; -- {serverError QUERY_IS_NOT_SUPPORTED_IN_MATERIALIZED_VIEW} + +DROP TABLE src_table; +DROP TABLE mv; \ No newline at end of file From 3f5853b970dd205465a5593d5786c1f8a4d82cc7 Mon Sep 17 00:00:00 2001 From: AN Date: Fri, 27 Oct 2023 19:17:13 +0300 Subject: [PATCH 002/985] Update index.md MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Punctuation fixes, узел→сервер as suggested by alexei-milovidov at https://github.com/ClickHouse/ClickHouse/pull/56040#issuecomment-1783155867, консистентность → согласованность (standard translation instead of calque) --- docs/ru/index.md | 18 +++++++++--------- 1 file changed, 9 
insertions(+), 9 deletions(-) diff --git a/docs/ru/index.md b/docs/ru/index.md index 78bb382753b..a9a666b18db 100644 --- a/docs/ru/index.md +++ b/docs/ru/index.md @@ -41,7 +41,7 @@ ClickHouse — столбцовая система управления база Разный порядок хранения данных лучше подходит для разных сценариев работы. Сценарий работы с данными — это то, какие производятся запросы, как часто и в каком соотношении; сколько читается данных на запросы каждого вида — строк, столбцов, байтов; как соотносятся чтения и обновления данных; какой рабочий размер данных и насколько локально он используется; используются ли транзакции и с какой изолированностью; какие требования к дублированию данных и логической целостности; требования к задержкам на выполнение и пропускной способности запросов каждого вида и т. п. -Чем больше нагрузка на систему, тем более важной становится специализация под сценарий работы, и тем более конкретной становится эта специализация. Не существует системы, одинаково хорошо подходящей под существенно различные сценарии работы. Если система подходит под широкое множество сценариев работы, то при достаточно большой нагрузке, система будет справляться со всеми сценариями работы плохо, или справляться хорошо только с одним из сценариев работы. +Чем больше нагрузка на систему, тем более важной становится специализация под сценарий работы, и тем более конкретной становится эта специализация. Не существует системы, одинаково хорошо подходящей под существенно различные сценарии работы. Если система подходит под широкое множество сценариев работы, то при достаточно большой нагрузке система будет справляться со всеми сценариями работы плохо, или справляться хорошо только с одним из сценариев работы. ## Ключевые особенности OLAP-сценария работы {#kliuchevye-osobennosti-olap-stsenariia-raboty} @@ -53,11 +53,11 @@ ClickHouse — столбцовая система управления база - запросы идут сравнительно редко (обычно не более сотни в секунду на сервер); - при выполнении простых запросов, допустимы задержки в районе 50 мс; - значения в столбцах достаточно мелкие — числа и небольшие строки (например, 60 байт на URL); -- требуется высокая пропускная способность при обработке одного запроса (до миллиардов строк в секунду на один узел); +- требуется высокая пропускная способность при обработке одного запроса (до миллиардов строк в секунду на один сервер); - транзакции отсутствуют; -- низкие требования к консистентности данных; -- в запросе одна большая таблица, все таблицы кроме одной маленькие; -- результат выполнения запроса существенно меньше исходных данных — то есть данные фильтруются или агрегируются; результат выполнения помещается в оперативную память одного узла. +- низкие требования к согласованности данных; +- в запросе одна большая таблица, все остальные таблицы из запроса — маленькие; +- результат выполнения запроса существенно меньше исходных данных — то есть данные фильтруются или агрегируются; результат выполнения помещается в оперативную память одного сервера. Легко видеть, что OLAP-сценарий работы существенно отличается от других распространённых сценариев работы (например, OLTP или Key-Value сценариев работы). Таким образом, не имеет никакого смысла пытаться использовать OLTP-системы или системы класса «ключ — значение» для обработки аналитических запросов, если вы хотите получить приличную производительность («выше плинтуса»). Например, если вы попытаетесь использовать для аналитики MongoDB или Redis — вы получите анекдотически низкую производительность по сравнению с OLAP-СУБД. 
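For example, a typical query in this scenario is a wide-table aggregation that reads only a couple of columns. The table and column names below are illustrative, loosely modelled on the web-analytics examples used elsewhere in these docs:

``` sql
-- Typical OLAP-style query: reads two columns of a wide fact table and aggregates
SELECT AdvEngineID, count() AS c
FROM hits
GROUP BY AdvEngineID
ORDER BY c DESC
LIMIT 20;
```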
@@ -77,11 +77,11 @@ ClickHouse — столбцовая система управления база ### По вводу-выводу {#po-vvodu-vyvodu} -1. Для выполнения аналитического запроса, требуется прочитать небольшое количество столбцов таблицы. В столбцовой БД для этого можно читать только нужные данные. Например, если вам требуется только 5 столбцов из 100, то следует рассчитывать на 20-кратное уменьшение ввода-вывода. -2. Так как данные читаются пачками, то их проще сжимать. Данные, лежащие по столбцам также лучше сжимаются. За счёт этого, дополнительно уменьшается объём ввода-вывода. -3. За счёт уменьшения ввода-вывода, больше данных влезает в системный кэш. +1. Для выполнения аналитического запроса требуется прочитать небольшое количество столбцов таблицы. В столбцовой БД для этого можно читать только нужные данные. Например, если вам требуется только 5 столбцов из 100, то следует рассчитывать на 20-кратное уменьшение ввода-вывода. +2. Так как данные читаются пачками, то их проще сжимать. Данные, лежащие по столбцам, также лучше сжимаются. За счёт этого, дополнительно уменьшается объём ввода-вывода. +3. За счёт уменьшения ввода-вывода больше данных влезает в системный кэш. -Например, для запроса «посчитать количество записей для каждой рекламной системы», требуется прочитать один столбец «идентификатор рекламной системы», который занимает 1 байт в несжатом виде. Если большинство переходов было не с рекламных систем, то можно рассчитывать хотя бы на десятикратное сжатие этого столбца. При использовании быстрого алгоритма сжатия, возможно разжатие данных со скоростью более нескольких гигабайт несжатых данных в секунду. То есть, такой запрос может выполняться со скоростью около нескольких миллиардов строк в секунду на одном сервере. На практике, такая скорость действительно достигается. +Например, для запроса «посчитать количество записей для каждой рекламной системы» требуется прочитать один столбец «идентификатор рекламной системы», который занимает 1 байт в несжатом виде. Если большинство переходов было не с рекламных систем, то можно рассчитывать хотя бы на десятикратное сжатие этого столбца. При использовании быстрого алгоритма сжатия возможно разжатие данных со скоростью более нескольких гигабайт несжатых данных в секунду. То есть такой запрос может выполняться со скоростью около нескольких миллиардов строк в секунду на одном сервере. На практике такая скорость действительно достигается. ### По вычислениям {#po-vychisleniiam} From 4dcbd6775a9cd1afe3c8be96e3c68c397ae547f0 Mon Sep 17 00:00:00 2001 From: Thom O'Connor Date: Fri, 3 Nov 2023 09:46:35 -0600 Subject: [PATCH 003/985] Update kill.md Added additional examples and context for killing queries and mutations --- docs/en/sql-reference/statements/kill.md | 64 ++++++++++++++++++++++++ 1 file changed, 64 insertions(+) diff --git a/docs/en/sql-reference/statements/kill.md b/docs/en/sql-reference/statements/kill.md index 294724dfa50..32de7a41e72 100644 --- a/docs/en/sql-reference/statements/kill.md +++ b/docs/en/sql-reference/statements/kill.md @@ -21,6 +21,35 @@ The queries to terminate are selected from the system.processes table using the Examples: +First, you'll need to get the list of incomplete queries. 
This SQL queries provides them according to those running the longest: + +List from a single ClickHouse node: +``` sql +SELECT + initial_query_id, + query_id, + formatReadableTimeDelta(elapsed) AS time_delta, + query, + * + FROM system.processes + WHERE query ILIKE 'SELECT%' + ORDER BY time_delta DESC; +``` + +List from a ClickHouse cluster: +``` sql +SELECT + initial_query_id, + query_id, + formatReadableTimeDelta(elapsed) AS time_delta, + query, + * + FROM clusterAllReplicas(default, system.processes) + WHERE query ILIKE 'SELECT%' + ORDER BY time_delta DESC; +``` + +Kill the query: ``` sql -- Forcibly terminates all queries with the specified query_id: KILL QUERY WHERE query_id='2-857d-4a57-9ee0-327da5d60a90' @@ -44,6 +73,8 @@ A test query (`TEST`) only checks the user’s rights and displays a list of que ## KILL MUTATION +One of the first things to check if a ClickHouse system or service is not running well is for long-running, incomplete mutations. The asynchronous (background) nature of mutations can cause a large queue of them that can then consume all available resources on the service. You may need to either pause all new mutations, INSERTs, and SELECTs and allow the queue of mutations to complete, or else manually kill some of these mutations. + ``` sql KILL MUTATION [ON CLUSTER cluster] WHERE @@ -57,6 +88,39 @@ A test query (`TEST`) only checks the user’s rights and displays a list of mut Examples: +Get a count() of the number of incomplete mutations: + +Count of mutations from a single ClickHouse node: +``` sql +SELECT count(*) +FROM system.mutations +WHERE is_done = 0; +``` + +Count of mutations from a ClickHouse cluster of replicas: +``` sql +SELECT count(*) +FROM clusterAllReplicas('default',system.mutations) +WHERE is_done = 0; +``` + +Query the list of incomplete mutations: + +List of mutations from a single ClickHouse node: +``` sql +SELECT mutation_id,* +FROM system.mutations +WHERE is_done = 0; +``` + +List of mutations from a ClickHouse cluster: +``` sql +SELECT mutation_id,* +FROM clusterAllReplicas('default',system.mutations) +WHERE is_done = 0; +``` + +Kill the mutations as needed: ``` sql -- Cancel and remove all mutations of the single table: KILL MUTATION WHERE database = 'default' AND table = 'table' From 1134af19caeaffcf70cc94146faed346d6af0cf6 Mon Sep 17 00:00:00 2001 From: Justin de Guzman Date: Tue, 7 Nov 2023 22:33:29 -0800 Subject: [PATCH 004/985] [Docs] Fix typo Co-authored-by: Johnny <9611008+johnnymatthews@users.noreply.github.com> --- docs/en/sql-reference/statements/kill.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/en/sql-reference/statements/kill.md b/docs/en/sql-reference/statements/kill.md index 32de7a41e72..a7d050e548c 100644 --- a/docs/en/sql-reference/statements/kill.md +++ b/docs/en/sql-reference/statements/kill.md @@ -21,7 +21,7 @@ The queries to terminate are selected from the system.processes table using the Examples: -First, you'll need to get the list of incomplete queries. This SQL queries provides them according to those running the longest: +First, you'll need to get the list of incomplete queries. 
This SQL query provides them according to those running the longest: List from a single ClickHouse node: ``` sql From 7e0d95e48cb399c047c9756d81b0f76ce67ea57f Mon Sep 17 00:00:00 2001 From: Justin de Guzman Date: Tue, 7 Nov 2023 22:33:43 -0800 Subject: [PATCH 005/985] [Docs] Formatting Co-authored-by: Johnny <9611008+johnnymatthews@users.noreply.github.com> --- docs/en/sql-reference/statements/kill.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/en/sql-reference/statements/kill.md b/docs/en/sql-reference/statements/kill.md index a7d050e548c..57448c4f441 100644 --- a/docs/en/sql-reference/statements/kill.md +++ b/docs/en/sql-reference/statements/kill.md @@ -88,7 +88,7 @@ A test query (`TEST`) only checks the user’s rights and displays a list of mut Examples: -Get a count() of the number of incomplete mutations: +Get a `count()` of the number of incomplete mutations: Count of mutations from a single ClickHouse node: ``` sql From ec02a2a2c4f4d4a279732df2c2dd61ab8b0cb80a Mon Sep 17 00:00:00 2001 From: Justin de Guzman Date: Tue, 7 Nov 2023 22:36:49 -0800 Subject: [PATCH 006/985] [Docs] Reword for clarity Co-authored-by: Johnny <9611008+johnnymatthews@users.noreply.github.com> --- docs/en/sql-reference/statements/kill.md | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/docs/en/sql-reference/statements/kill.md b/docs/en/sql-reference/statements/kill.md index 57448c4f441..c85870fc0c8 100644 --- a/docs/en/sql-reference/statements/kill.md +++ b/docs/en/sql-reference/statements/kill.md @@ -73,7 +73,10 @@ A test query (`TEST`) only checks the user’s rights and displays a list of que ## KILL MUTATION -One of the first things to check if a ClickHouse system or service is not running well is for long-running, incomplete mutations. The asynchronous (background) nature of mutations can cause a large queue of them that can then consume all available resources on the service. You may need to either pause all new mutations, INSERTs, and SELECTs and allow the queue of mutations to complete, or else manually kill some of these mutations. +The presence of long-running or incomplete mutations often indicates that a ClickHouse service is running poorly. The asynchronous nature of mutations can cause them to consume all available resources on a system. You may need to either: + +- Pause all new mutations, `INSERT`s , and `SELECT`s and allow the queue of mutations to complete. +- Or manually kill some of these mutations by sending a `KILLSIG` command. 
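Before killing anything, it is often worth checking why a mutation is stuck. A sketch of such a check, assuming the failure-related columns of `system.mutations` available in recent ClickHouse versions:

``` sql
-- Inspect incomplete mutations together with their last recorded failure, if any
SELECT
    database,
    table,
    mutation_id,
    command,
    parts_to_do,
    latest_fail_reason
FROM system.mutations
WHERE is_done = 0
ORDER BY create_time ASC;
```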
``` sql KILL MUTATION [ON CLUSTER cluster] From 039bb1d599a5262e558b9b4ebd66fd85469afa3c Mon Sep 17 00:00:00 2001 From: Alexander Tokmakov Date: Mon, 22 Jan 2024 20:26:28 +0100 Subject: [PATCH 007/985] fix race on Context::async_insert_queue --- src/Interpreters/Context.cpp | 14 ++++++++++++-- 1 file changed, 12 insertions(+), 2 deletions(-) diff --git a/src/Interpreters/Context.cpp b/src/Interpreters/Context.cpp index 7e89c794712..51cfd302338 100644 --- a/src/Interpreters/Context.cpp +++ b/src/Interpreters/Context.cpp @@ -181,6 +181,7 @@ namespace ErrorCodes extern const int ILLEGAL_COLUMN; extern const int NUMBER_OF_COLUMNS_DOESNT_MATCH; extern const int CLUSTER_DOESNT_EXIST; + extern const int ABORTED; } #define SHUTDOWN(log, desc, ptr, method) do \ @@ -556,7 +557,12 @@ struct ContextSharedPart : boost::noncopyable return; /// Need to flush the async insert queue before shutting down the database catalog - async_insert_queue.reset(); + std::shared_ptr delete_async_insert_queue; + { + std::lock_guard lock(mutex); + delete_async_insert_queue = std::move(async_insert_queue); + } + delete_async_insert_queue.reset(); /// Stop periodic reloading of the configuration files. /// This must be done first because otherwise the reloading may pass a changed config @@ -4838,11 +4844,15 @@ PartUUIDsPtr Context::getIgnoredPartUUIDs() const AsynchronousInsertQueue * Context::getAsynchronousInsertQueue() const { - return shared->async_insert_queue.get(); + std::lock_guard lock(mutex); + if (auto res = shared->async_insert_queue.get()) + return res; + throw Exception(ErrorCodes::ABORTED, "AsynchronousInsertQueue is not initialized yet or has been already shutdown"); } void Context::setAsynchronousInsertQueue(const std::shared_ptr & ptr) { + std::lock_guard lock(mutex); using namespace std::chrono; if (std::chrono::milliseconds(settings.async_insert_busy_timeout_ms) == 0ms) From eb881667638524f182f06e19d699704ce9e86196 Mon Sep 17 00:00:00 2001 From: Alexander Tokmakov Date: Tue, 23 Jan 2024 00:28:28 +0100 Subject: [PATCH 008/985] Update Context.cpp --- src/Interpreters/Context.cpp | 5 +---- 1 file changed, 1 insertion(+), 4 deletions(-) diff --git a/src/Interpreters/Context.cpp b/src/Interpreters/Context.cpp index 51cfd302338..217b247c21c 100644 --- a/src/Interpreters/Context.cpp +++ b/src/Interpreters/Context.cpp @@ -181,7 +181,6 @@ namespace ErrorCodes extern const int ILLEGAL_COLUMN; extern const int NUMBER_OF_COLUMNS_DOESNT_MATCH; extern const int CLUSTER_DOESNT_EXIST; - extern const int ABORTED; } #define SHUTDOWN(log, desc, ptr, method) do \ @@ -4845,9 +4844,7 @@ PartUUIDsPtr Context::getIgnoredPartUUIDs() const AsynchronousInsertQueue * Context::getAsynchronousInsertQueue() const { std::lock_guard lock(mutex); - if (auto res = shared->async_insert_queue.get()) - return res; - throw Exception(ErrorCodes::ABORTED, "AsynchronousInsertQueue is not initialized yet or has been already shutdown"); + return shared->async_insert_queue.get(); } void Context::setAsynchronousInsertQueue(const std::shared_ptr & ptr) From 4cfc8d1a34342d44adbc7d9c8c3a4916670d68b2 Mon Sep 17 00:00:00 2001 From: Alexander Tokmakov Date: Tue, 23 Jan 2024 00:30:42 +0100 Subject: [PATCH 009/985] better method name --- src/Interpreters/Context.cpp | 2 +- src/Interpreters/Context.h | 2 +- src/Interpreters/InterpreterSystemQuery.cpp | 2 +- src/Interpreters/executeQuery.cpp | 2 +- src/Server/TCPHandler.cpp | 2 +- src/Storages/System/StorageSystemAsynchronousInserts.cpp | 2 +- 6 files changed, 6 insertions(+), 6 deletions(-) diff --git 
a/src/Interpreters/Context.cpp b/src/Interpreters/Context.cpp index 217b247c21c..ab42e6b0ec9 100644 --- a/src/Interpreters/Context.cpp +++ b/src/Interpreters/Context.cpp @@ -4841,7 +4841,7 @@ PartUUIDsPtr Context::getIgnoredPartUUIDs() const return ignored_part_uuids; } -AsynchronousInsertQueue * Context::getAsynchronousInsertQueue() const +AsynchronousInsertQueue * Context::tryGetAsynchronousInsertQueue() const { std::lock_guard lock(mutex); return shared->async_insert_queue.get(); diff --git a/src/Interpreters/Context.h b/src/Interpreters/Context.h index 65566876a80..6180bfbde88 100644 --- a/src/Interpreters/Context.h +++ b/src/Interpreters/Context.h @@ -1203,7 +1203,7 @@ public: PartUUIDsPtr getPartUUIDs() const; PartUUIDsPtr getIgnoredPartUUIDs() const; - AsynchronousInsertQueue * getAsynchronousInsertQueue() const; + AsynchronousInsertQueue * tryGetAsynchronousInsertQueue() const; void setAsynchronousInsertQueue(const std::shared_ptr & ptr); ReadTaskCallback getReadTaskCallback() const; diff --git a/src/Interpreters/InterpreterSystemQuery.cpp b/src/Interpreters/InterpreterSystemQuery.cpp index 1712c9608bf..f478b43049f 100644 --- a/src/Interpreters/InterpreterSystemQuery.cpp +++ b/src/Interpreters/InterpreterSystemQuery.cpp @@ -692,7 +692,7 @@ BlockIO InterpreterSystemQuery::execute() case Type::FLUSH_ASYNC_INSERT_QUEUE: { getContext()->checkAccess(AccessType::SYSTEM_FLUSH_ASYNC_INSERT_QUEUE); - auto * queue = getContext()->getAsynchronousInsertQueue(); + auto * queue = getContext()->tryGetAsynchronousInsertQueue(); if (!queue) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Cannot flush asynchronous insert queue because it is not initialized"); diff --git a/src/Interpreters/executeQuery.cpp b/src/Interpreters/executeQuery.cpp index 4b5a6a84e17..a84c957d9a8 100644 --- a/src/Interpreters/executeQuery.cpp +++ b/src/Interpreters/executeQuery.cpp @@ -924,7 +924,7 @@ static std::tuple executeQueryImpl( std::unique_ptr interpreter; bool async_insert = false; - auto * queue = context->getAsynchronousInsertQueue(); + auto * queue = context->tryGetAsynchronousInsertQueue(); auto * logger = &Poco::Logger::get("executeQuery"); if (insert_query && async_insert_enabled) diff --git a/src/Server/TCPHandler.cpp b/src/Server/TCPHandler.cpp index fa7206eeaac..9bc6c3872fd 100644 --- a/src/Server/TCPHandler.cpp +++ b/src/Server/TCPHandler.cpp @@ -907,7 +907,7 @@ void TCPHandler::processInsertQuery() Block processed_block; const auto & settings = query_context->getSettingsRef(); - auto * insert_queue = query_context->getAsynchronousInsertQueue(); + auto * insert_queue = query_context->tryGetAsynchronousInsertQueue(); const auto & insert_query = assert_cast(*state.parsed_query); bool async_insert_enabled = settings.async_insert; diff --git a/src/Storages/System/StorageSystemAsynchronousInserts.cpp b/src/Storages/System/StorageSystemAsynchronousInserts.cpp index 20ba4d1cdfb..b480821f8ea 100644 --- a/src/Storages/System/StorageSystemAsynchronousInserts.cpp +++ b/src/Storages/System/StorageSystemAsynchronousInserts.cpp @@ -34,7 +34,7 @@ void StorageSystemAsynchronousInserts::fillData(MutableColumns & res_columns, Co { using namespace std::chrono; - auto * insert_queue = context->getAsynchronousInsertQueue(); + auto * insert_queue = context->tryGetAsynchronousInsertQueue(); if (!insert_queue) return; From f91feb0dcb405df80f317f456372c7374f2c75ee Mon Sep 17 00:00:00 2001 From: Daniil Ivanik Date: Tue, 30 Jan 2024 14:17:11 +0100 Subject: [PATCH 010/985] Initial working commit --- 
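Note on intended usage: the patches starting here add a PostgreSQL-style `generate_series` table function (inclusive bounds, optional step, result column named `generate_series`). A rough sketch derived from the `TableFunctionGenerateSeries` code in this patch — the reference output of the test added later in the series is not reproduced here:

``` sql
SELECT * FROM generate_series(1, 10);     -- 1, 2, ..., 10
SELECT * FROM generate_series(0, 10, 3);  -- 0, 3, 6, 9 (third argument is the step)
SELECT * FROM generate_series(5, 1);      -- empty result, since start > stop
```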
.../QueryPlan/ReadFromSystemNumbersStep.cpp | 210 ++++++++++-------- src/Storages/SelectQueryInfo.h | 2 +- src/Storages/System/StorageSystemNumbers.cpp | 8 +- src/Storages/System/StorageSystemNumbers.h | 36 +-- src/Storages/System/attachSystemTables.cpp | 5 +- src/TableFunctions/CMakeLists.txt | 2 +- src/TableFunctions/ITableFunction.cpp | 2 +- src/TableFunctions/TableFunctionNumbers.cpp | 2 +- .../TableFunctionsGenerateSeries.cpp | 100 +++++++++ src/TableFunctions/registerTableFunctions.cpp | 1 + src/TableFunctions/registerTableFunctions.h | 1 + 11 files changed, 234 insertions(+), 135 deletions(-) create mode 100644 src/TableFunctions/TableFunctionsGenerateSeries.cpp diff --git a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp index 5173b18c6bf..13a14ffb917 100644 --- a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp +++ b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp @@ -26,41 +26,59 @@ namespace class NumbersSource : public ISource { public: - NumbersSource(UInt64 block_size_, UInt64 offset_, UInt64 step_) - : ISource(createHeader()), block_size(block_size_), next(offset_), step(step_) + NumbersSource(UInt64 block_size_, UInt64 offset_, UInt64 step_, const std::string& column_name, UInt64 inner_step_) + : ISource(createHeader(column_name)), block_size(block_size_), next(offset_), step(step_), inner_step(inner_step_), inner_remainder(offset_ % inner_step_) { } String getName() const override { return "Numbers"; } - static Block createHeader() { return {ColumnWithTypeAndName(ColumnUInt64::create(), std::make_shared(), "number")}; } + static Block createHeader(const std::string& column_name) { return {ColumnWithTypeAndName(ColumnUInt64::create(), std::make_shared(), column_name)}; } protected: Chunk generate() override { - auto column = ColumnUInt64::create(block_size); - ColumnUInt64::Container & vec = column->getData(); UInt64 curr = next; /// The local variable for some reason works faster (>20%) than member of class. + UInt64 first_element = (curr / inner_step) * inner_step + inner_remainder; + if (first_element < curr) { + first_element += inner_step; + } + UInt64 filtered_block_size = 0; + if (first_element - curr >= block_size) { + auto column = ColumnUInt64::create(0); + return {Columns{std::move(column)}, filtered_block_size}; + } + if (first_element - curr < block_size) { + filtered_block_size = (block_size - (first_element - curr) - 1) / inner_step + 1; + } + + auto column = ColumnUInt64::create(filtered_block_size); + ColumnUInt64::Container & vec = column->getData(); UInt64 * pos = vec.data(); /// This also accelerates the code. 
- UInt64 * end = &vec[block_size]; - iota(pos, static_cast(end - pos), curr); + UInt64 * end = &vec[filtered_block_size]; + iota(pos, static_cast(end - pos), UInt64{0}); + for (UInt64 p = 0; p < filtered_block_size; p += 1) { + vec[p] = vec[p] * inner_step + first_element; + } next += step; progress(column->size(), column->byteSize()); - return {Columns{std::move(column)}, block_size}; + return {Columns{std::move(column)}, filtered_block_size}; } private: UInt64 block_size; UInt64 next; UInt64 step; + UInt64 inner_step; + UInt64 inner_remainder; }; -UInt128 sizeOfRange(const Range & r) +[[maybe_unused]] UInt128 sizeOfRange(const Range & r) { UInt128 size; if (r.right.isPositiveInfinity()) @@ -77,7 +95,7 @@ UInt128 sizeOfRange(const Range & r) return size; }; -auto sizeOfRanges(const Ranges & rs) +[[maybe_unused]] auto sizeOfRanges(const Ranges & rs) { UInt128 total_size{}; for (const Range & r : rs) @@ -91,7 +109,7 @@ auto sizeOfRanges(const Ranges & rs) /// Generate numbers according to ranges. /// Numbers generated is ordered in one stream. /// Notice that we will not generate additional numbers out of ranges. -class NumbersRangedSource : public ISource +class [[maybe_unused]] NumbersRangedSource : public ISource { public: /// Represent a position in Ranges list. @@ -109,8 +127,8 @@ public: using RangesStatePtr = std::shared_ptr; - NumbersRangedSource(const Ranges & ranges_, RangesStatePtr & ranges_state_, UInt64 base_block_size_) - : ISource(NumbersSource::createHeader()), ranges(ranges_), ranges_state(ranges_state_), base_block_size(base_block_size_) + [[maybe_unused]] NumbersRangedSource(const Ranges & ranges_, RangesStatePtr & ranges_state_, UInt64 base_block_size_, const std::string& column_name) + : ISource(NumbersSource::createHeader(column_name)), ranges(ranges_), ranges_state(ranges_state_), base_block_size(base_block_size_) { } @@ -273,7 +291,7 @@ private: namespace { /// Whether we should push limit down to scan. -bool shouldPushdownLimit(SelectQueryInfo & query_info, UInt64 limit_length) +[[maybe_unused]] bool shouldPushdownLimit(SelectQueryInfo & query_info, UInt64 limit_length) { const auto & query = query_info.query->as(); /// Just ignore some minor cases, such as: @@ -286,7 +304,7 @@ bool shouldPushdownLimit(SelectQueryInfo & query_info, UInt64 limit_length) /// Shrink ranges to size. 
/// For example: ranges: [1, 5], [8, 100]; size: 7, we will get [1, 5], [8, 9] -void shrinkRanges(Ranges & ranges, size_t size) +[[maybe_unused]] void shrinkRanges(Ranges & ranges, size_t size) { size_t last_range_idx = 0; for (size_t i = 0; i < ranges.size(); i++) @@ -375,107 +393,107 @@ Pipe ReadFromSystemNumbersStep::makePipe() num_streams = 1; /// Build rpn of query filters - KeyCondition condition(buildFilterDAG(), context, column_names, key_expression); + // KeyCondition condition(buildFilterDAG(), context, column_names, key_expression); Pipe pipe; Ranges ranges; - if (condition.extractPlainRanges(ranges)) - { - /// Intersect ranges with table range - std::optional table_range; - std::optional overflowed_table_range; + // if (condition.extractPlainRanges(ranges)) + // { + // /// Intersect ranges with table range + // std::optional table_range; + // std::optional overflowed_table_range; - if (numbers_storage.limit.has_value()) - { - if (std::numeric_limits::max() - numbers_storage.offset >= *(numbers_storage.limit)) - { - table_range.emplace(FieldRef(numbers_storage.offset), true, FieldRef(numbers_storage.offset + *(numbers_storage.limit)), false); - } - /// UInt64 overflow, for example: SELECT number FROM numbers(18446744073709551614, 5) - else - { - table_range.emplace(FieldRef(numbers_storage.offset), true, std::numeric_limits::max(), true); - auto overflow_end = UInt128(numbers_storage.offset) + UInt128(*numbers_storage.limit); - overflowed_table_range.emplace( - FieldRef(UInt64(0)), true, FieldRef(UInt64(overflow_end - std::numeric_limits::max() - 1)), false); - } - } - else - { - table_range.emplace(FieldRef(numbers_storage.offset), true, FieldRef(std::numeric_limits::max()), true); - } + // if (numbers_storage.limit.has_value()) + // { + // if (std::numeric_limits::max() - numbers_storage.offset >= *(numbers_storage.limit)) + // { + // table_range.emplace(FieldRef(numbers_storage.offset), true, FieldRef(numbers_storage.offset + *(numbers_storage.limit)), false); + // } + // /// UInt64 overflow, for example: SELECT number FROM numbers(18446744073709551614, 5) + // else + // { + // table_range.emplace(FieldRef(numbers_storage.offset), true, std::numeric_limits::max(), true); + // auto overflow_end = UInt128(numbers_storage.offset) + UInt128(*numbers_storage.limit); + // overflowed_table_range.emplace( + // FieldRef(UInt64(0)), true, FieldRef(UInt64(overflow_end - std::numeric_limits::max() - 1)), false); + // } + // } + // else + // { + // table_range.emplace(FieldRef(numbers_storage.offset), true, FieldRef(std::numeric_limits::max()), true); + // } - Ranges intersected_ranges; - for (auto & r : ranges) - { - auto intersected_range = table_range->intersectWith(r); - if (intersected_range) - intersected_ranges.push_back(*intersected_range); - } - /// intersection with overflowed_table_range goes back. - if (overflowed_table_range.has_value()) - { - for (auto & r : ranges) - { - auto intersected_range = overflowed_table_range->intersectWith(r); - if (intersected_range) - intersected_ranges.push_back(*overflowed_table_range); - } - } + // Ranges intersected_ranges; + // for (auto & r : ranges) + // { + // auto intersected_range = table_range->intersectWith(r); + // if (intersected_range) + // intersected_ranges.push_back(*intersected_range); + // } + // /// intersection with overflowed_table_range goes back. 
+ // if (overflowed_table_range.has_value()) + // { + // for (auto & r : ranges) + // { + // auto intersected_range = overflowed_table_range->intersectWith(r); + // if (intersected_range) + // intersected_ranges.push_back(*overflowed_table_range); + // } + // } - /// ranges is blank, return a source who has no data - if (intersected_ranges.empty()) - { - pipe.addSource(std::make_shared(NumbersSource::createHeader())); - return pipe; - } - const auto & limit_length = limit_length_and_offset.first; - const auto & limit_offset = limit_length_and_offset.second; + // /// ranges is blank, return a source who has no data + // if (intersected_ranges.empty()) + // { + // pipe.addSource(std::make_shared(NumbersSource::createHeader(numbers_storage.column_name))); + // return pipe; + // } + // const auto & limit_length = limit_length_and_offset.first; + // const auto & limit_offset = limit_length_and_offset.second; - /// If intersected ranges is limited or we can pushdown limit. - if (!intersected_ranges.rbegin()->right.isPositiveInfinity() || should_pushdown_limit) - { - UInt128 total_size = sizeOfRanges(intersected_ranges); - UInt128 query_limit = limit_length + limit_offset; + // /// If intersected ranges is limited or we can pushdown limit. + // if (!intersected_ranges.rbegin()->right.isPositiveInfinity() || should_pushdown_limit) + // { + // UInt128 total_size = sizeOfRanges(intersected_ranges); + // UInt128 query_limit = limit_length + limit_offset; - /// limit total_size by query_limit - if (should_pushdown_limit && query_limit < total_size) - { - total_size = query_limit; - /// We should shrink intersected_ranges for case: - /// intersected_ranges: [1, 4], [7, 100]; query_limit: 2 - shrinkRanges(intersected_ranges, total_size); - } + // /// limit total_size by query_limit + // if (should_pushdown_limit && query_limit < total_size) + // { + // total_size = query_limit; + // /// We should shrink intersected_ranges for case: + // /// intersected_ranges: [1, 4], [7, 100]; query_limit: 2 + // shrinkRanges(intersected_ranges, total_size); + // } - checkLimits(size_t(total_size)); + // checkLimits(size_t(total_size)); - if (total_size / max_block_size < num_streams) - num_streams = static_cast(total_size / max_block_size); + // if (total_size / max_block_size < num_streams) + // num_streams = static_cast(total_size / max_block_size); - if (num_streams == 0) - num_streams = 1; + // if (num_streams == 0) + // num_streams = 1; - /// Ranges state, all streams will share the state. - auto ranges_state = std::make_shared(); - for (size_t i = 0; i < num_streams; ++i) - { - auto source = std::make_shared(intersected_ranges, ranges_state, max_block_size); + // /// Ranges state, all streams will share the state. 
+ // auto ranges_state = std::make_shared(); + // for (size_t i = 0; i < num_streams; ++i) + // { + // auto source = std::make_shared(intersected_ranges, ranges_state, max_block_size, numbers_storage.column_name); - if (i == 0) - source->addTotalRowsApprox(total_size); + // if (i == 0) + // source->addTotalRowsApprox(total_size); - pipe.addSource(std::move(source)); - } - return pipe; - } - } + // pipe.addSource(std::move(source)); + // } + // return pipe; + // } + // } /// Fall back to NumbersSource for (size_t i = 0; i < num_streams; ++i) { auto source - = std::make_shared(max_block_size, numbers_storage.offset + i * max_block_size, num_streams * max_block_size); + = std::make_shared(max_block_size, numbers_storage.offset + i * max_block_size, num_streams * max_block_size, numbers_storage.column_name, numbers_storage.step); if (numbers_storage.limit && i == 0) { diff --git a/src/Storages/SelectQueryInfo.h b/src/Storages/SelectQueryInfo.h index 662a5c0ef5a..2b4afaa6345 100644 --- a/src/Storages/SelectQueryInfo.h +++ b/src/Storages/SelectQueryInfo.h @@ -229,4 +229,4 @@ struct SelectQueryInfo bool isFinal() const; }; -} + } diff --git a/src/Storages/System/StorageSystemNumbers.cpp b/src/Storages/System/StorageSystemNumbers.cpp index b100be7cdf4..cd7207917a9 100644 --- a/src/Storages/System/StorageSystemNumbers.cpp +++ b/src/Storages/System/StorageSystemNumbers.cpp @@ -11,15 +11,16 @@ #include #include #include +#include namespace DB { -StorageSystemNumbers::StorageSystemNumbers(const StorageID & table_id, bool multithreaded_, std::optional limit_, UInt64 offset_) - : IStorage(table_id), multithreaded(multithreaded_), limit(limit_), offset(offset_) +StorageSystemNumbers::StorageSystemNumbers(const StorageID & table_id, bool multithreaded_, const std::string& column_name_, std::optional limit_, UInt64 offset_, UInt64 step_) + : IStorage(table_id), multithreaded(multithreaded_), limit(limit_), offset(offset_), column_name(column_name_), step(step_) { StorageInMemoryMetadata storage_metadata; - storage_metadata.setColumns(ColumnsDescription({{"number", std::make_shared()}})); + storage_metadata.setColumns(ColumnsDescription({{column_name_, std::make_shared()}})); setInMemoryMetadata(storage_metadata); } @@ -33,6 +34,7 @@ void StorageSystemNumbers::read( size_t max_block_size, size_t num_streams) { + // LOG_DEBUG(&Poco::Logger::get("Reading from SystemNumbers"), "Limit : {}", limit.value()); query_plan.addStep(std::make_unique( column_names, shared_from_this(), storage_snapshot, query_info, std::move(context), max_block_size, num_streams)); } diff --git a/src/Storages/System/StorageSystemNumbers.h b/src/Storages/System/StorageSystemNumbers.h index fe6227db406..ffe87b8ad14 100644 --- a/src/Storages/System/StorageSystemNumbers.h +++ b/src/Storages/System/StorageSystemNumbers.h @@ -10,39 +10,11 @@ namespace DB class Context; - -/** Implements a table engine for the system table "numbers". - * The table contains the only column number UInt64. - * From this table, you can read all natural numbers, starting from 0 (to 2^64 - 1, and then again). - * - * You could also specify a limit (how many numbers to give). - * - * How to generate numbers? - * - * 1. First try a smart fashion: - * - * In this fashion we try to push filters and limit down to scanning. - * Firstly extract plain ranges(no overlapping and ordered) by filter expressions. 
- * - * For example: - * where (numbers > 1 and numbers < 3) or (numbers in (4, 6)) or (numbers > 7 and numbers < 9) - * - * We will get ranges - * (1, 3), [4, 4], [6, 6], (7, 9) - * - * Then split the ranges evenly to one or multi-streams. With this way we will get result without large scanning. - * - * 2. If fail to extract plain ranges, fall back to ordinary scanning. - * - * If multithreaded is specified, numbers will be generated in several streams - * (and result could be out of order). If both multithreaded and limit are specified, - * the table could give you not exactly 1..limit range, but some arbitrary 'limit' numbers. - */ -class StorageSystemNumbers final : public IStorage +class StorageSystemNumbers final : public IStorage { public: /// Otherwise, streams concurrently increment atomic. - StorageSystemNumbers(const StorageID & table_id, bool multithreaded_, std::optional limit_ = std::nullopt, UInt64 offset_ = 0); + StorageSystemNumbers(const StorageID & table_id, bool multithreaded_, const std::string& column_name, std::optional limit_ = std::nullopt, UInt64 offset_ = 0, UInt64 step_ = 1); std::string getName() const override { return "SystemNumbers"; } @@ -67,6 +39,10 @@ private: bool multithreaded; std::optional limit; UInt64 offset; + std::string column_name; + + UInt64 step; + }; } diff --git a/src/Storages/System/attachSystemTables.cpp b/src/Storages/System/attachSystemTables.cpp index bf898f57833..ddd89709b6a 100644 --- a/src/Storages/System/attachSystemTables.cpp +++ b/src/Storages/System/attachSystemTables.cpp @@ -118,8 +118,9 @@ namespace DB void attachSystemTablesServer(ContextPtr context, IDatabase & system_database, bool has_zookeeper) { attach(context, system_database, "one", "This table contains a single row with a single dummy UInt8 column containing the value 0. Used when the table is not specified explicitly, for example in queries like `SELECT 1`."); - attach(context, system_database, "numbers", "Generates all natural numbers, starting from 0 (to 2^64 - 1, and then again) in sorted order.", false); - attach(context, system_database, "numbers_mt", "Multithreaded version of `system.numbers`. Numbers order is not guaranteed.", true); + attach(context, system_database, "numbers", "Generates all natural numbers, starting from 0 (to 2^64 - 1, and then again) in sorted order.", false, "number"); + attach(context, system_database, "numbers_mt", "Multithreaded version of `system.numbers`. Numbers order is not guaranteed.", true, "number"); + // attach(context, system_database, "generate_series", "Multithreaded version of `system.numbers`. 
Numbers order is not guaranteed.", false, "generate_series"); attach(context, system_database, "zeros", "Produces unlimited number of non-materialized zeros.", false); attach(context, system_database, "zeros_mt", "Multithreaded version of system.zeros.", true); attach(context, system_database, "databases", "Lists all databases of the current server."); diff --git a/src/TableFunctions/CMakeLists.txt b/src/TableFunctions/CMakeLists.txt index 770990cc405..c5c2a660935 100644 --- a/src/TableFunctions/CMakeLists.txt +++ b/src/TableFunctions/CMakeLists.txt @@ -29,7 +29,7 @@ if (TARGET ch_contrib::azure_sdk) target_link_libraries(clickhouse_table_functions PRIVATE ch_contrib::azure_sdk) endif () -if (TARGET ch_contrib::simdjson) +if (TARGET ch_co`trib::simdjson) target_link_libraries(clickhouse_table_functions PRIVATE ch_contrib::simdjson) endif () diff --git a/src/TableFunctions/ITableFunction.cpp b/src/TableFunctions/ITableFunction.cpp index 137e1dc27fe..c854b6b0f9c 100644 --- a/src/TableFunctions/ITableFunction.cpp +++ b/src/TableFunctions/ITableFunction.cpp @@ -5,7 +5,7 @@ #include #include #include - +#include namespace ProfileEvents { diff --git a/src/TableFunctions/TableFunctionNumbers.cpp b/src/TableFunctions/TableFunctionNumbers.cpp index 262018f108c..71a9ba097c6 100644 --- a/src/TableFunctions/TableFunctionNumbers.cpp +++ b/src/TableFunctions/TableFunctionNumbers.cpp @@ -63,7 +63,7 @@ StoragePtr TableFunctionNumbers::executeImpl(const ASTPtr & ast_f UInt64 offset = arguments.size() == 2 ? evaluateArgument(context, arguments[0]) : 0; UInt64 length = arguments.size() == 2 ? evaluateArgument(context, arguments[1]) : evaluateArgument(context, arguments[0]); - auto res = std::make_shared(StorageID(getDatabaseName(), table_name), multithreaded, length, offset); + auto res = std::make_shared(StorageID(getDatabaseName(), table_name), multithreaded, std::string{"number"}, length, offset); res->startup(); return res; } diff --git a/src/TableFunctions/TableFunctionsGenerateSeries.cpp b/src/TableFunctions/TableFunctionsGenerateSeries.cpp new file mode 100644 index 00000000000..3941f1eadb2 --- /dev/null +++ b/src/TableFunctions/TableFunctionsGenerateSeries.cpp @@ -0,0 +1,100 @@ +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include "registerTableFunctions.h" + + +namespace DB +{ + +namespace ErrorCodes +{ + extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; + extern const int ILLEGAL_TYPE_OF_ARGUMENT; +} + +namespace +{ + +/* numbers(limit), numbers_mt(limit) + * - the same as SELECT number FROM system.numbers LIMIT limit. + * Used for testing purposes, as a simple example of table function. 
+ */ +class TableFunctionGenerateSeries : public ITableFunction +{ +public: + static constexpr auto name = "generate_series"; + std::string getName() const override { return name; } + bool hasStaticStructure() const override { return true; } +private: + StoragePtr executeImpl(const ASTPtr & ast_function, ContextPtr context, const std::string & table_name, ColumnsDescription cached_columns, bool is_insert_query) const override; + const char * getStorageTypeName() const override { return "SystemNumbers"; } + + UInt64 evaluateArgument(ContextPtr context, ASTPtr & argument) const; + + ColumnsDescription getActualTableStructure(ContextPtr context, bool is_insert_query) const override; +}; + +ColumnsDescription TableFunctionGenerateSeries::getActualTableStructure(ContextPtr /*context*/, bool /*is_insert_query*/) const +{ + /// NOTE: https://bugs.llvm.org/show_bug.cgi?id=47418 + return ColumnsDescription{{{"generate_series", std::make_shared()}}}; +} + +StoragePtr TableFunctionGenerateSeries::executeImpl(const ASTPtr & ast_function, ContextPtr context, const std::string & table_name, ColumnsDescription /*cached_columns*/, bool /*is_insert_query*/) const +{ + if (const auto * function = ast_function->as()) + { + auto arguments = function->arguments->children; + + if (arguments.size() != 2 && arguments.size() != 3) + throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Table function '{}' requires 'length' or 'offset, length'.", getName()); + + UInt64 start = evaluateArgument(context, arguments[0]); + UInt64 stop = evaluateArgument(context, arguments[1]); + UInt64 interval = (arguments.size() == 3) ? evaluateArgument(context, arguments[2]) : UInt64{1}; + if (start > stop) { + auto res = std::make_shared(StorageID(getDatabaseName(), table_name), false, std::string{"generate_series"}, 0); + res->startup(); + return res; + } + + auto res = std::make_shared(StorageID(getDatabaseName(), table_name), false, std::string{"generate_series"}, (stop - start) / interval + 1, start, interval); + res->startup(); + return res; + } + throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Table function '{}' requires 'limit' or 'offset, limit'.", getName()); +} + +UInt64 TableFunctionGenerateSeries::evaluateArgument(ContextPtr context, ASTPtr & argument) const +{ + const auto & [field, type] = evaluateConstantExpression(argument, context); + + if (!isNativeNumber(type)) + throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "Illegal type {} expression, must be numeric type", type->getName()); + + Field converted = convertFieldToType(field, DataTypeUInt64()); + if (converted.isNull()) + throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "The value {} is not representable as UInt64", + applyVisitor(FieldVisitorToString(), field)); + + return converted.safeGet(); +} + + +} + +void registerTableFunctionGenerateSeries(TableFunctionFactory & factory) +{ + factory.registerFunction({.documentation = {}, .allow_readonly = true}); + // factory.registerFunction({.documentation = {}, .allow_readonly = true}); +} + +} diff --git a/src/TableFunctions/registerTableFunctions.cpp b/src/TableFunctions/registerTableFunctions.cpp index 8c18c298f45..1631fa8e879 100644 --- a/src/TableFunctions/registerTableFunctions.cpp +++ b/src/TableFunctions/registerTableFunctions.cpp @@ -11,6 +11,7 @@ void registerTableFunctions() registerTableFunctionMerge(factory); registerTableFunctionRemote(factory); registerTableFunctionNumbers(factory); + registerTableFunctionGenerateSeries(factory); registerTableFunctionNull(factory); 
registerTableFunctionZeros(factory); registerTableFunctionExecutable(factory); diff --git a/src/TableFunctions/registerTableFunctions.h b/src/TableFunctions/registerTableFunctions.h index fae763e7dc8..111fbe8c22f 100644 --- a/src/TableFunctions/registerTableFunctions.h +++ b/src/TableFunctions/registerTableFunctions.h @@ -8,6 +8,7 @@ class TableFunctionFactory; void registerTableFunctionMerge(TableFunctionFactory & factory); void registerTableFunctionRemote(TableFunctionFactory & factory); void registerTableFunctionNumbers(TableFunctionFactory & factory); +void registerTableFunctionGenerateSeries(TableFunctionFactory & factory); void registerTableFunctionNull(TableFunctionFactory & factory); void registerTableFunctionZeros(TableFunctionFactory & factory); void registerTableFunctionExecutable(TableFunctionFactory & factory); From 3f0cfbd8c0816b007ff85b1a3997696ce5ed3214 Mon Sep 17 00:00:00 2001 From: Daniil Ivanik Date: Sat, 3 Feb 2024 19:46:00 +0100 Subject: [PATCH 011/985] Kek --- src/Common/iota.cpp | 29 ++ src/Common/iota.h | 9 + .../QueryPlan/ReadFromSystemNumbersStep.cpp | 281 ++++++++++-------- 3 files changed, 197 insertions(+), 122 deletions(-) diff --git a/src/Common/iota.cpp b/src/Common/iota.cpp index 98f18eb195b..532c4bde76d 100644 --- a/src/Common/iota.cpp +++ b/src/Common/iota.cpp @@ -27,10 +27,39 @@ void iota(T * begin, size_t count, T first_value) return iotaImpl(begin, count, first_value); } +MULTITARGET_FUNCTION_AVX2_SSE42( + MULTITARGET_FUNCTION_HEADER(template void NO_INLINE), + iotaWithStepImpl, MULTITARGET_FUNCTION_BODY((T * begin, size_t count, T first_value, T step) /// NOLINT + { + for (size_t i = 0; i < count; i++) + *(begin + i) = static_cast(first_value + i * step); + }) +) + +template +void iota_with_step(T * begin, size_t count, T first_value, T step) +{ +#if USE_MULTITARGET_CODE + if (isArchSupported(TargetArch::AVX2)) + return iotaWithStepImplAVX2(begin, count, first_value, step); + + if (isArchSupported(TargetArch::SSE42)) + return iotaWithStepImplSSE42(begin, count, first_value, step); +#endif + return iotaWithStepImpl(begin, count, first_value, step); +} + template void iota(UInt8 * begin, size_t count, UInt8 first_value); template void iota(UInt32 * begin, size_t count, UInt32 first_value); template void iota(UInt64 * begin, size_t count, UInt64 first_value); #if defined(OS_DARWIN) template void iota(size_t * begin, size_t count, size_t first_value); #endif + +template void iota_with_step(UInt8 * begin, size_t count, UInt8 first_value, UInt8 step); +template void iota_with_step(UInt32 * begin, size_t count, UInt32 first_value, UInt32 step); +template void iota_with_step(UInt64 * begin, size_t count, UInt64 first_value, UInt64 step); +#if defined(OS_DARWIN) +extern template void iota_with_step(size_t * begin, size_t count, size_t first_value, size_t step); +#endif } diff --git a/src/Common/iota.h b/src/Common/iota.h index 7910274d15d..f40cde9d5db 100644 --- a/src/Common/iota.h +++ b/src/Common/iota.h @@ -31,4 +31,13 @@ extern template void iota(UInt64 * begin, size_t count, UInt64 first_value); #if defined(OS_DARWIN) extern template void iota(size_t * begin, size_t count, size_t first_value); #endif + +template void iota_with_step(T * begin, size_t count, T first_value, T step); + +extern template void iota_with_step(UInt8 * begin, size_t count, UInt8 first_value, UInt8 step); +extern template void iota_with_step(UInt32 * begin, size_t count, UInt32 first_value, UInt32 step); +extern template void iota_with_step(UInt64 * begin, size_t count, UInt64 
first_value, UInt64 step); +#if defined(OS_DARWIN) +extern template void iota(size_t * begin, size_t count, size_t first_value, size_t step); +#endif } diff --git a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp index 13a14ffb917..f85473e43c3 100644 --- a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp +++ b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp @@ -12,6 +12,8 @@ #include #include +#include + namespace DB { @@ -30,9 +32,9 @@ public: : ISource(createHeader(column_name)), block_size(block_size_), next(offset_), step(step_), inner_step(inner_step_), inner_remainder(offset_ % inner_step_) { } - String getName() const override { return "Numbers"; } + static Block createHeader(const std::string& column_name) { return {ColumnWithTypeAndName(ColumnUInt64::create(), std::make_shared(), column_name)}; } protected: @@ -57,10 +59,7 @@ protected: ColumnUInt64::Container & vec = column->getData(); UInt64 * pos = vec.data(); /// This also accelerates the code. UInt64 * end = &vec[filtered_block_size]; - iota(pos, static_cast(end - pos), UInt64{0}); - for (UInt64 p = 0; p < filtered_block_size; p += 1) { - vec[p] = vec[p] * inner_step + first_element; - } + iota_with_step(pos, static_cast(end - pos), first_element, inner_step); next += step; @@ -77,28 +76,46 @@ private: UInt64 inner_remainder; }; - -[[maybe_unused]] UInt128 sizeOfRange(const Range & r) -{ - UInt128 size; - if (r.right.isPositiveInfinity()) - return static_cast(std::numeric_limits::max()) - r.left.get() + r.left_included; - - size = static_cast(r.right.get()) - r.left.get() + 1; - - if (!r.left_included) - size--; - - if (!r.right_included) - size--; - assert(size >= 0); - return size; +struct RangeWithStep { + Range range; + UInt64 step; }; -[[maybe_unused]] auto sizeOfRanges(const Ranges & rs) +using RangesWithStep = std::vector; + +std::optional stepped_range_from_range(const Range& r, UInt64 step, UInt64 remainder) { + UInt64 begin = (r.left.get() / step) * step; + if (begin > std::numeric_limits::max() - remainder) { + return std::nullopt; + } + begin += remainder; + while (begin <= r.left.get() - r.left_included) { + if (std::numeric_limits::max() - step < begin) { + return std::nullopt; + } + begin += step; + } + + LOG_DEBUG(&Poco::Logger::get("stepped_range_from_range"), "Begin: {}", begin); + UInt128 right_edge = (r.right.get() + r.right_included); + if (begin >= right_edge) { + return std::nullopt; + } + return std::optional{RangeWithStep{Range(begin, true, static_cast(right_edge - 1), true), step}}; +} + +[[maybe_unused]] UInt128 sizeOfRange(const RangeWithStep & r) +{ + if (r.range.right.isPositiveInfinity()) + return static_cast(std::numeric_limits::max() - r.range.left.get()) / r.step + r.range.left_included; + + return static_cast(r.range.right.get() - r.range.left.get()) / r.step + 1; +}; + +[[maybe_unused]] auto sizeOfRanges(const RangesWithStep & rs) { UInt128 total_size{}; - for (const Range & r : rs) + for (const RangeWithStep & r : rs) { /// total_size will never overflow total_size += sizeOfRange(r); @@ -127,7 +144,7 @@ public: using RangesStatePtr = std::shared_ptr; - [[maybe_unused]] NumbersRangedSource(const Ranges & ranges_, RangesStatePtr & ranges_state_, UInt64 base_block_size_, const std::string& column_name) + [[maybe_unused]] NumbersRangedSource(const RangesWithStep & ranges_, RangesStatePtr & ranges_state_, UInt64 base_block_size_, const std::string& column_name) : ISource(NumbersSource::createHeader(column_name)), 
ranges(ranges_), ranges_state(ranges_state_), base_block_size(base_block_size_) { } @@ -187,9 +204,9 @@ protected: if (ranges.empty()) return {}; - auto first_value = [](const Range & r) { return r.left.get() + (r.left_included ? 0 : 1); }; + auto first_value = [](const RangeWithStep & r) { return r.range.left.get() + (r.range.left_included ? 0 : 1); }; - auto last_value = [](const Range & r) { return r.right.get() - (r.right_included ? 0 : 1); }; + auto last_value = [](const RangeWithStep & r) { return r.range.right.get() - (r.range.right_included ? 0 : 1); }; /// Find the data range. /// If data left is small, shrink block size. @@ -215,31 +232,33 @@ protected: UInt128 can_provide = cursor.offset_in_ranges == end.offset_in_ranges ? end.offset_in_range - cursor.offset_in_range - : static_cast(last_value(range)) - first_value(range) + 1 - cursor.offset_in_range; + : static_cast(last_value(range) - first_value(range)) / range.step + 1 - cursor.offset_in_range; /// set value to block - auto set_value = [&pos](UInt128 & start_value, UInt128 & end_value) + auto set_value = [&pos, this](UInt128 & start_value, UInt128 & end_value) { if (end_value > std::numeric_limits::max()) { - while (start_value < end_value) - *(pos++) = start_value++; + while (start_value < end_value) { + *(pos++) = start_value; + start_value += this->step; + } } else { auto start_value_64 = static_cast(start_value); auto end_value_64 = static_cast(end_value); auto size = end_value_64 - start_value_64; - iota(pos, static_cast(size), start_value_64); + iota_with_step(pos, static_cast(size), start_value_64, step); pos += size; } }; if (can_provide > need) { - UInt64 start_value = first_value(range) + cursor.offset_in_range; + UInt64 start_value = first_value(range) + cursor.offset_in_range * step; /// end_value will never overflow - iota(pos, static_cast(need), start_value); + iota_with_step(pos, static_cast(need), start_value, step); pos += need; provided += need; @@ -248,8 +267,8 @@ protected: else if (can_provide == need) { /// to avoid UInt64 overflow - UInt128 start_value = static_cast(first_value(range)) + cursor.offset_in_range; - UInt128 end_value = start_value + need; + UInt128 start_value = static_cast(first_value(range)) + cursor.offset_in_range * step; + UInt128 end_value = start_value + need * step; set_value(start_value, end_value); provided += need; @@ -259,8 +278,8 @@ protected: else { /// to avoid UInt64 overflow - UInt128 start_value = static_cast(first_value(range)) + cursor.offset_in_range; - UInt128 end_value = start_value + can_provide; + UInt128 start_value = static_cast(first_value(range)) + cursor.offset_in_range * step; + UInt128 end_value = start_value + can_provide * step; set_value(start_value, end_value); provided += static_cast(can_provide); @@ -277,13 +296,15 @@ protected: private: /// The ranges is shared between all streams. - Ranges ranges; + RangesWithStep ranges; /// Ranges state shared between all streams, actually is the start of the ranges. RangesStatePtr ranges_state; /// Base block size, will shrink when data left is not enough. UInt64 base_block_size; + + UInt64 step; }; } @@ -304,7 +325,7 @@ namespace /// Shrink ranges to size. 
/// For example: ranges: [1, 5], [8, 100]; size: 7, we will get [1, 5], [8, 9] -[[maybe_unused]] void shrinkRanges(Ranges & ranges, size_t size) +[[maybe_unused]] void shrinkRanges(RangesWithStep & ranges, size_t size) { size_t last_range_idx = 0; for (size_t i = 0; i < ranges.size(); i++) @@ -323,9 +344,9 @@ namespace else { auto & range = ranges[i]; - UInt64 right = range.left.get() + static_cast(size); - range.right = Field(right); - range.right_included = !range.left_included; + UInt64 right = range.range.left.get() + static_cast(size); + range.range.right = Field(right); + range.range.right_included = !range.range.left_included; last_range_idx = i; break; } @@ -393,101 +414,117 @@ Pipe ReadFromSystemNumbersStep::makePipe() num_streams = 1; /// Build rpn of query filters - // KeyCondition condition(buildFilterDAG(), context, column_names, key_expression); + KeyCondition condition(buildFilterDAG(), context, column_names, key_expression); Pipe pipe; Ranges ranges; - // if (condition.extractPlainRanges(ranges)) - // { - // /// Intersect ranges with table range - // std::optional table_range; - // std::optional overflowed_table_range; + if (condition.extractPlainRanges(ranges)) + { + LOG_DEBUG(&Poco::Logger::get("My logger"), "Use optimization"); + /// Intersect ranges with table range + std::optional table_range; + std::optional overflowed_table_range; - // if (numbers_storage.limit.has_value()) - // { - // if (std::numeric_limits::max() - numbers_storage.offset >= *(numbers_storage.limit)) - // { - // table_range.emplace(FieldRef(numbers_storage.offset), true, FieldRef(numbers_storage.offset + *(numbers_storage.limit)), false); - // } - // /// UInt64 overflow, for example: SELECT number FROM numbers(18446744073709551614, 5) - // else - // { - // table_range.emplace(FieldRef(numbers_storage.offset), true, std::numeric_limits::max(), true); - // auto overflow_end = UInt128(numbers_storage.offset) + UInt128(*numbers_storage.limit); - // overflowed_table_range.emplace( - // FieldRef(UInt64(0)), true, FieldRef(UInt64(overflow_end - std::numeric_limits::max() - 1)), false); - // } - // } - // else - // { - // table_range.emplace(FieldRef(numbers_storage.offset), true, FieldRef(std::numeric_limits::max()), true); - // } + if (numbers_storage.limit.has_value()) + { + if (std::numeric_limits::max() - numbers_storage.offset >= *(numbers_storage.limit)) + { + table_range.emplace(FieldRef(numbers_storage.offset), true, FieldRef(numbers_storage.offset + *(numbers_storage.limit)), false); + } + /// UInt64 overflow, for example: SELECT number FROM numbers(18446744073709551614, 5) + else + { + table_range.emplace(FieldRef(numbers_storage.offset), true, std::numeric_limits::max(), true); + auto overflow_end = UInt128(numbers_storage.offset) + UInt128(*numbers_storage.limit); + overflowed_table_range.emplace( + FieldRef(UInt64(0)), true, FieldRef(UInt64(overflow_end - std::numeric_limits::max() - 1)), false); + } + } + else + { + table_range.emplace(FieldRef(numbers_storage.offset), true, FieldRef(std::numeric_limits::max()), true); + } + LOG_DEBUG(&Poco::Logger::get("My logger"), "Found table ranges"); - // Ranges intersected_ranges; - // for (auto & r : ranges) - // { - // auto intersected_range = table_range->intersectWith(r); - // if (intersected_range) - // intersected_ranges.push_back(*intersected_range); - // } - // /// intersection with overflowed_table_range goes back. 
- // if (overflowed_table_range.has_value()) - // { - // for (auto & r : ranges) - // { - // auto intersected_range = overflowed_table_range->intersectWith(r); - // if (intersected_range) - // intersected_ranges.push_back(*overflowed_table_range); - // } - // } + RangesWithStep intersected_ranges; + for (auto & r : ranges) + { + auto intersected_range = table_range->intersectWith(r); + if (intersected_range.has_value()) { + auto range_with_step = stepped_range_from_range(intersected_range.value(), numbers_storage.step, numbers_storage.offset % numbers_storage.step); + if (range_with_step.has_value()) { + intersected_ranges.push_back(*range_with_step); + } + } + } - // /// ranges is blank, return a source who has no data - // if (intersected_ranges.empty()) - // { - // pipe.addSource(std::make_shared(NumbersSource::createHeader(numbers_storage.column_name))); - // return pipe; - // } - // const auto & limit_length = limit_length_and_offset.first; - // const auto & limit_offset = limit_length_and_offset.second; - // /// If intersected ranges is limited or we can pushdown limit. - // if (!intersected_ranges.rbegin()->right.isPositiveInfinity() || should_pushdown_limit) - // { - // UInt128 total_size = sizeOfRanges(intersected_ranges); - // UInt128 query_limit = limit_length + limit_offset; + for (const auto& range : intersected_ranges) { + LOG_DEBUG(&Poco::Logger::get("Ranges"), "Left: {}; Right {}, LI: {}, RI: {}, Step: {}", range.range.left.get(), range.range.right.get(), range.range.left_included, range.range.right_included, range.step); + // std::cout << + } + /// intersection with overflowed_table_range goes back. + if (overflowed_table_range.has_value()) + { + for (auto & r : ranges) + { + auto intersected_range = overflowed_table_range->intersectWith(r); + if (intersected_range) { + auto range_with_step = stepped_range_from_range(intersected_range.value(), numbers_storage.step, static_cast((static_cast(numbers_storage.offset) + std::numeric_limits::max() + 1) % numbers_storage.step)); + if (range_with_step) { + intersected_ranges.push_back(*range_with_step); + } + } + } + } - // /// limit total_size by query_limit - // if (should_pushdown_limit && query_limit < total_size) - // { - // total_size = query_limit; - // /// We should shrink intersected_ranges for case: - // /// intersected_ranges: [1, 4], [7, 100]; query_limit: 2 - // shrinkRanges(intersected_ranges, total_size); - // } + /// ranges is blank, return a source who has no data + if (intersected_ranges.empty()) + { + pipe.addSource(std::make_shared(NumbersSource::createHeader(numbers_storage.column_name))); + return pipe; + } + const auto & limit_length = limit_length_and_offset.first; + const auto & limit_offset = limit_length_and_offset.second; - // checkLimits(size_t(total_size)); + /// If intersected ranges is limited or we can pushdown limit. 
+ if (!intersected_ranges.rbegin()->range.right.isPositiveInfinity() || should_pushdown_limit) + { + UInt128 total_size = sizeOfRanges(intersected_ranges); + UInt128 query_limit = limit_length + limit_offset; - // if (total_size / max_block_size < num_streams) - // num_streams = static_cast(total_size / max_block_size); + /// limit total_size by query_limit + if (should_pushdown_limit && query_limit < total_size) + { + total_size = query_limit; + /// We should shrink intersected_ranges for case: + /// intersected_ranges: [1, 4], [7, 100]; query_limit: 2 + shrinkRanges(intersected_ranges, total_size); + } - // if (num_streams == 0) - // num_streams = 1; + checkLimits(size_t(total_size)); - // /// Ranges state, all streams will share the state. - // auto ranges_state = std::make_shared(); - // for (size_t i = 0; i < num_streams; ++i) - // { - // auto source = std::make_shared(intersected_ranges, ranges_state, max_block_size, numbers_storage.column_name); + if (total_size / max_block_size < num_streams) + num_streams = static_cast(total_size / max_block_size); - // if (i == 0) - // source->addTotalRowsApprox(total_size); + if (num_streams == 0) + num_streams = 1; - // pipe.addSource(std::move(source)); - // } - // return pipe; - // } - // } + /// Ranges state, all streams will share the state. + auto ranges_state = std::make_shared(); + for (size_t i = 0; i < num_streams; ++i) + { + auto source = std::make_shared(intersected_ranges, ranges_state, max_block_size, numbers_storage.column_name); + + if (i == 0) + source->addTotalRowsApprox(total_size); + + pipe.addSource(std::move(source)); + } + return pipe; + } + } /// Fall back to NumbersSource for (size_t i = 0; i < num_streams; ++i) From 623b42574587073845a76a5e28a502a792ee6662 Mon Sep 17 00:00:00 2001 From: divanik Date: Tue, 6 Feb 2024 21:34:09 +0000 Subject: [PATCH 012/985] Add feature with the right author name --- .../QueryPlan/ReadFromSystemNumbersStep.cpp | 175 +++++++++++++----- src/Storages/SelectQueryInfo.h | 2 +- src/Storages/System/StorageSystemNumbers.cpp | 8 +- src/Storages/System/StorageSystemNumbers.h | 15 +- src/Storages/System/attachSystemTables.cpp | 2 +- src/TableFunctions/CMakeLists.txt | 2 +- src/TableFunctions/ITableFunction.cpp | 2 +- ...es.cpp => TableFunctionGenerateSeries.cpp} | 55 ++++-- src/TableFunctions/TableFunctionNumbers.cpp | 45 +++-- .../02970_generate_series.reference | 28 +++ .../0_stateless/02970_generate_series.sql | 14 ++ 11 files changed, 254 insertions(+), 94 deletions(-) rename src/TableFunctions/{TableFunctionsGenerateSeries.cpp => TableFunctionGenerateSeries.cpp} (65%) create mode 100644 tests/queries/0_stateless/02970_generate_series.reference create mode 100644 tests/queries/0_stateless/02970_generate_series.sql diff --git a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp index f85473e43c3..4b957778c43 100644 --- a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp +++ b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp @@ -28,32 +28,37 @@ namespace class NumbersSource : public ISource { public: - NumbersSource(UInt64 block_size_, UInt64 offset_, UInt64 step_, const std::string& column_name, UInt64 inner_step_) - : ISource(createHeader(column_name)), block_size(block_size_), next(offset_), step(step_), inner_step(inner_step_), inner_remainder(offset_ % inner_step_) + NumbersSource(UInt64 block_size_, UInt64 offset_, UInt64 step_, const std::string & column_name, UInt64 inner_step_) + : ISource(createHeader(column_name)) + 
, block_size(block_size_) + , next(offset_) + , step(step_) + , inner_step(inner_step_) + , inner_remainder(offset_ % inner_step_) { } String getName() const override { return "Numbers"; } - - static Block createHeader(const std::string& column_name) { return {ColumnWithTypeAndName(ColumnUInt64::create(), std::make_shared(), column_name)}; } + static Block createHeader(const std::string & column_name) + { + return {ColumnWithTypeAndName(ColumnUInt64::create(), std::make_shared(), column_name)}; + } protected: Chunk generate() override { - UInt64 curr = next; /// The local variable for some reason works faster (>20%) than member of class. UInt64 first_element = (curr / inner_step) * inner_step + inner_remainder; - if (first_element < curr) { + if (first_element < curr) first_element += inner_step; - } UInt64 filtered_block_size = 0; - if (first_element - curr >= block_size) { + if (first_element - curr >= block_size) + { auto column = ColumnUInt64::create(0); return {Columns{std::move(column)}, filtered_block_size}; } - if (first_element - curr < block_size) { + if (first_element - curr < block_size) filtered_block_size = (block_size - (first_element - curr) - 1) / inner_step + 1; - } auto column = ColumnUInt64::create(filtered_block_size); ColumnUInt64::Container & vec = column->getData(); @@ -76,32 +81,37 @@ private: UInt64 inner_remainder; }; -struct RangeWithStep { +struct RangeWithStep +{ Range range; UInt64 step; }; using RangesWithStep = std::vector; -std::optional stepped_range_from_range(const Range& r, UInt64 step, UInt64 remainder) { - UInt64 begin = (r.left.get() / step) * step; - if (begin > std::numeric_limits::max() - remainder) { +std::optional stepped_range_from_range(const Range & r, UInt64 step, UInt64 remainder) +{ + if ((r.right.get() == 0) && (!r.right_included)) + return std::nullopt; + UInt64 begin = (r.left.get() / step) * step; + if (begin > std::numeric_limits::max() - remainder) return std::nullopt; - } begin += remainder; - while (begin <= r.left.get() - r.left_included) { - if (std::numeric_limits::max() - step < begin) { + + // LOG_DEBUG(&Poco::Logger::get("stepped_range_from_range"), "Begin: {}", begin); + // LOG_DEBUG(&Poco::Logger::get("stepped_range_from_range"), "Begin: {}", begin); + while ((r.left_included <= r.left.get()) && (begin <= r.left.get() - r.left_included)) + { + if (std::numeric_limits::max() - step < begin) return std::nullopt; - } begin += step; } - LOG_DEBUG(&Poco::Logger::get("stepped_range_from_range"), "Begin: {}", begin); - UInt128 right_edge = (r.right.get() + r.right_included); - if (begin >= right_edge) { + // LOG_DEBUG(&Poco::Logger::get("stepped_range_from_range"), "Begin: {}", begin); + if ((begin >= r.right_included) && (begin - r.right_included >= r.right.get())) return std::nullopt; - } - return std::optional{RangeWithStep{Range(begin, true, static_cast(right_edge - 1), true), step}}; + UInt64 right_edge_included = r.right.get() - (1 - r.right_included); + return std::optional{RangeWithStep{Range(begin, true, right_edge_included, true), step}}; } [[maybe_unused]] UInt128 sizeOfRange(const RangeWithStep & r) @@ -144,8 +154,17 @@ public: using RangesStatePtr = std::shared_ptr; - [[maybe_unused]] NumbersRangedSource(const RangesWithStep & ranges_, RangesStatePtr & ranges_state_, UInt64 base_block_size_, const std::string& column_name) - : ISource(NumbersSource::createHeader(column_name)), ranges(ranges_), ranges_state(ranges_state_), base_block_size(base_block_size_) + [[maybe_unused]] NumbersRangedSource( + const RangesWithStep 
& ranges_, + RangesStatePtr & ranges_state_, + UInt64 base_block_size_, + UInt64 step_, + const std::string & column_name) + : ISource(NumbersSource::createHeader(column_name)) + , ranges(ranges_) + , ranges_state(ranges_state_) + , base_block_size(base_block_size_) + , step(step_) { } @@ -158,6 +177,7 @@ protected: { std::lock_guard lock(ranges_state->mutex); + UInt64 need = base_block_size_; UInt64 size = 0; /// how many item found. @@ -196,6 +216,10 @@ protected: } ranges_state->pos = end; + + LOG_DEBUG(&Poco::Logger::get("Range borders"), "Begin: {} {}", start.offset_in_ranges, static_cast(start.offset_in_range)); + LOG_DEBUG(&Poco::Logger::get("Range borders"), "End: {} {}", end.offset_in_ranges, static_cast(end.offset_in_range)); + return size; } @@ -234,12 +258,19 @@ protected: ? end.offset_in_range - cursor.offset_in_range : static_cast(last_value(range) - first_value(range)) / range.step + 1 - cursor.offset_in_range; + LOG_DEBUG( + &Poco::Logger::get("Generate"), + "Can Provide: {}, Block size: {}", + static_cast(can_provide), + static_cast(block_size)); + /// set value to block auto set_value = [&pos, this](UInt128 & start_value, UInt128 & end_value) { if (end_value > std::numeric_limits::max()) { - while (start_value < end_value) { + while (start_value < end_value) + { *(pos++) = start_value; start_value += this->step; } @@ -248,7 +279,9 @@ protected: { auto start_value_64 = static_cast(start_value); auto end_value_64 = static_cast(end_value); - auto size = end_value_64 - start_value_64; + auto size = (end_value_64 - start_value_64) / this->step; + LOG_DEBUG( + &Poco::Logger::get("Iota"), "Size: {}, Step: {}, Start: {}", static_cast(size), this->step, start_value_64); iota_with_step(pos, static_cast(size), start_value_64, step); pos += size; } @@ -374,7 +407,7 @@ ReadFromSystemNumbersStep::ReadFromSystemNumbersStep( , key_expression{KeyDescription::parse(column_names[0], storage_snapshot->metadata->columns, context).expression} , max_block_size{max_block_size_} , num_streams{num_streams_} - , limit_length_and_offset(InterpreterSelectQuery::getLimitLengthAndOffset(query_info.query->as(), context)) + , limit_length_and_offset(InterpreterSelectQuery::getLimitLengthAndOffset(query_info.query->as(), context)) , should_pushdown_limit(shouldPushdownLimit(query_info, limit_length_and_offset.first)) , limit(query_info.limit) , storage_limits(query_info.storage_limits) @@ -410,14 +443,28 @@ Pipe ReadFromSystemNumbersStep::makePipe() { auto & numbers_storage = storage->as(); + LOG_DEBUG( + &Poco::Logger::get("Parameters"), + "Parameters: Limit: {}, Offset: {} Step: {}", + numbers_storage.limit.value(), + numbers_storage.offset, + numbers_storage.step); + if (!numbers_storage.multithreaded) num_streams = 1; + Pipe pipe; + Ranges ranges; + + if (numbers_storage.limit.has_value() && (numbers_storage.limit.value() == 0)) + { + pipe.addSource(std::make_shared(NumbersSource::createHeader(numbers_storage.column_name))); + return pipe; + } + /// Build rpn of query filters KeyCondition condition(buildFilterDAG(), context, column_names, key_expression); - Pipe pipe; - Ranges ranges; if (condition.extractPlainRanges(ranges)) { @@ -430,14 +477,15 @@ Pipe ReadFromSystemNumbersStep::makePipe() { if (std::numeric_limits::max() - numbers_storage.offset >= *(numbers_storage.limit)) { - table_range.emplace(FieldRef(numbers_storage.offset), true, FieldRef(numbers_storage.offset + *(numbers_storage.limit)), false); + table_range.emplace( + FieldRef(numbers_storage.offset), true, 
FieldRef(numbers_storage.offset + *(numbers_storage.limit)), false); } /// UInt64 overflow, for example: SELECT number FROM numbers(18446744073709551614, 5) else { table_range.emplace(FieldRef(numbers_storage.offset), true, std::numeric_limits::max(), true); auto overflow_end = UInt128(numbers_storage.offset) + UInt128(*numbers_storage.limit); - overflowed_table_range.emplace( + overflowed_table_range.emplace( FieldRef(UInt64(0)), true, FieldRef(UInt64(overflow_end - std::numeric_limits::max() - 1)), false); } } @@ -451,34 +499,59 @@ Pipe ReadFromSystemNumbersStep::makePipe() for (auto & r : ranges) { auto intersected_range = table_range->intersectWith(r); - if (intersected_range.has_value()) { - auto range_with_step = stepped_range_from_range(intersected_range.value(), numbers_storage.step, numbers_storage.offset % numbers_storage.step); - if (range_with_step.has_value()) { + if (intersected_range.has_value()) + { + LOG_DEBUG( + &Poco::Logger::get("Ranges"), + "Ranges: {} {} {} {}", + intersected_range->left.get(), + intersected_range->right.get(), + intersected_range->left_included, + intersected_range->right_included); + auto range_with_step = stepped_range_from_range( + intersected_range.value(), numbers_storage.step, numbers_storage.offset % numbers_storage.step); + if (range_with_step.has_value()) + { + LOG_DEBUG( + &Poco::Logger::get("Ranges With Step"), + "Ranges: {} {} {} {} {}", + range_with_step->range.left.get(), + range_with_step->range.right.get(), + range_with_step->range.left_included, + range_with_step->range.right_included, + range_with_step->step); intersected_ranges.push_back(*range_with_step); } } } - for (const auto& range : intersected_ranges) { - LOG_DEBUG(&Poco::Logger::get("Ranges"), "Left: {}; Right {}, LI: {}, RI: {}, Step: {}", range.range.left.get(), range.range.right.get(), range.range.left_included, range.range.right_included, range.step); - // std::cout << - } /// intersection with overflowed_table_range goes back. 
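/// Worked example of the overflow case from the comment above (illustrative): for SELECT number FROM numbers(18446744073709551614, 5) with step 1,
/// table_range is [18446744073709551614, 18446744073709551615] and overflowed_table_range is [0, 3),
/// so the wrapped values 0, 1 and 2 are matched against the filter ranges below as well.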
if (overflowed_table_range.has_value()) { for (auto & r : ranges) { auto intersected_range = overflowed_table_range->intersectWith(r); - if (intersected_range) { - auto range_with_step = stepped_range_from_range(intersected_range.value(), numbers_storage.step, static_cast((static_cast(numbers_storage.offset) + std::numeric_limits::max() + 1) % numbers_storage.step)); - if (range_with_step) { + if (intersected_range) + { + auto range_with_step = stepped_range_from_range( + intersected_range.value(), + numbers_storage.step, + static_cast( + (static_cast(numbers_storage.offset) + std::numeric_limits::max() + 1) + % numbers_storage.step)); + if (range_with_step) intersected_ranges.push_back(*range_with_step); - } } } } + // for (const auto& range : intersected_ranges) + // { + // LOG_DEBUG(&Poco::Logger::get("Ranges with step"), "Left: {}; Right {}, LI: {}, RI: {}, Step: {}", range.range.left.get(), range.range.right.get(), range.range.left_included, range.range.right_included, range.step); + // // std::cout << + // } + /// ranges is blank, return a source who has no data if (intersected_ranges.empty()) { @@ -492,6 +565,7 @@ Pipe ReadFromSystemNumbersStep::makePipe() if (!intersected_ranges.rbegin()->range.right.isPositiveInfinity() || should_pushdown_limit) { UInt128 total_size = sizeOfRanges(intersected_ranges); + LOG_DEBUG(&Poco::Logger::get("Total_Size"), "Total Size: {}", static_cast(total_size)); UInt128 query_limit = limit_length + limit_offset; /// limit total_size by query_limit @@ -515,7 +589,8 @@ Pipe ReadFromSystemNumbersStep::makePipe() auto ranges_state = std::make_shared(); for (size_t i = 0; i < num_streams; ++i) { - auto source = std::make_shared(intersected_ranges, ranges_state, max_block_size, numbers_storage.column_name); + auto source = std::make_shared( + intersected_ranges, ranges_state, max_block_size, numbers_storage.step, numbers_storage.column_name); if (i == 0) source->addTotalRowsApprox(total_size); @@ -529,12 +604,16 @@ Pipe ReadFromSystemNumbersStep::makePipe() /// Fall back to NumbersSource for (size_t i = 0; i < num_streams; ++i) { - auto source - = std::make_shared(max_block_size, numbers_storage.offset + i * max_block_size, num_streams * max_block_size, numbers_storage.column_name, numbers_storage.step); + auto source = std::make_shared( + max_block_size, + numbers_storage.offset + i * max_block_size, + num_streams * max_block_size, + numbers_storage.column_name, + numbers_storage.step); if (numbers_storage.limit && i == 0) { - auto rows_appr = *(numbers_storage.limit); + auto rows_appr = (*numbers_storage.limit - 1) / numbers_storage.step + 1; if (limit > 0 && limit < rows_appr) rows_appr = limit; source->addTotalRowsApprox(rows_appr); @@ -546,7 +625,7 @@ Pipe ReadFromSystemNumbersStep::makePipe() if (numbers_storage.limit) { size_t i = 0; - auto storage_limit = *(numbers_storage.limit); + auto storage_limit = (*numbers_storage.limit - 1) / numbers_storage.step + 1; /// This formula is how to split 'limit' elements to 'num_streams' chunks almost uniformly. 
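/// Illustrative check of the formula mentioned above: with storage_limit = 10 and num_streams = 3,
/// the streams receive roughly 3, 3 and 4 rows each, i.e. within one row of a perfectly even split.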
pipe.addSimpleTransform( [&](const Block & header) diff --git a/src/Storages/SelectQueryInfo.h b/src/Storages/SelectQueryInfo.h index 2b4afaa6345..662a5c0ef5a 100644 --- a/src/Storages/SelectQueryInfo.h +++ b/src/Storages/SelectQueryInfo.h @@ -229,4 +229,4 @@ struct SelectQueryInfo bool isFinal() const; }; - } +} diff --git a/src/Storages/System/StorageSystemNumbers.cpp b/src/Storages/System/StorageSystemNumbers.cpp index cd7207917a9..4c319ec7105 100644 --- a/src/Storages/System/StorageSystemNumbers.cpp +++ b/src/Storages/System/StorageSystemNumbers.cpp @@ -16,7 +16,13 @@ namespace DB { -StorageSystemNumbers::StorageSystemNumbers(const StorageID & table_id, bool multithreaded_, const std::string& column_name_, std::optional limit_, UInt64 offset_, UInt64 step_) +StorageSystemNumbers::StorageSystemNumbers( + const StorageID & table_id, + bool multithreaded_, + const std::string & column_name_, + std::optional limit_, + UInt64 offset_, + UInt64 step_) : IStorage(table_id), multithreaded(multithreaded_), limit(limit_), offset(offset_), column_name(column_name_), step(step_) { StorageInMemoryMetadata storage_metadata; diff --git a/src/Storages/System/StorageSystemNumbers.h b/src/Storages/System/StorageSystemNumbers.h index ffe87b8ad14..9663ee25251 100644 --- a/src/Storages/System/StorageSystemNumbers.h +++ b/src/Storages/System/StorageSystemNumbers.h @@ -10,11 +10,17 @@ namespace DB class Context; -class StorageSystemNumbers final : public IStorage +class StorageSystemNumbers final : public IStorage { public: /// Otherwise, streams concurrently increment atomic. - StorageSystemNumbers(const StorageID & table_id, bool multithreaded_, const std::string& column_name, std::optional limit_ = std::nullopt, UInt64 offset_ = 0, UInt64 step_ = 1); + StorageSystemNumbers( + const StorageID & table_id, + bool multithreaded_, + const std::string & column_name, + std::optional limit_ = std::nullopt, + UInt64 offset_ = 0, + UInt64 step_ = 1); std::string getName() const override { return "SystemNumbers"; } @@ -30,7 +36,6 @@ public: bool hasEvenlyDistributedRead() const override { return true; } bool isSystemStorage() const override { return true; } - bool supportsTransactions() const override { return true; } private: @@ -38,11 +43,9 @@ private: bool multithreaded; std::optional limit; - UInt64 offset; + UInt64 offset;` std::string column_name; - UInt64 step; - }; } diff --git a/src/Storages/System/attachSystemTables.cpp b/src/Storages/System/attachSystemTables.cpp index ddd89709b6a..9eacb07bd8d 100644 --- a/src/Storages/System/attachSystemTables.cpp +++ b/src/Storages/System/attachSystemTables.cpp @@ -120,7 +120,7 @@ void attachSystemTablesServer(ContextPtr context, IDatabase & system_database, b attach(context, system_database, "one", "This table contains a single row with a single dummy UInt8 column containing the value 0. Used when the table is not specified explicitly, for example in queries like `SELECT 1`."); attach(context, system_database, "numbers", "Generates all natural numbers, starting from 0 (to 2^64 - 1, and then again) in sorted order.", false, "number"); attach(context, system_database, "numbers_mt", "Multithreaded version of `system.numbers`. Numbers order is not guaranteed.", true, "number"); - // attach(context, system_database, "generate_series", "Multithreaded version of `system.numbers`. 
Numbers order is not guaranteed.", false, "generate_series"); + attach(context, system_database, "generate_series", "Generates arithmetic progression of natural numbers in sorted order in a given segment with a given step", false, "generate_series"); attach(context, system_database, "zeros", "Produces unlimited number of non-materialized zeros.", false); attach(context, system_database, "zeros_mt", "Multithreaded version of system.zeros.", true); attach(context, system_database, "databases", "Lists all databases of the current server."); diff --git a/src/TableFunctions/CMakeLists.txt b/src/TableFunctions/CMakeLists.txt index c5c2a660935..770990cc405 100644 --- a/src/TableFunctions/CMakeLists.txt +++ b/src/TableFunctions/CMakeLists.txt @@ -29,7 +29,7 @@ if (TARGET ch_contrib::azure_sdk) target_link_libraries(clickhouse_table_functions PRIVATE ch_contrib::azure_sdk) endif () -if (TARGET ch_co`trib::simdjson) +if (TARGET ch_contrib::simdjson) target_link_libraries(clickhouse_table_functions PRIVATE ch_contrib::simdjson) endif () diff --git a/src/TableFunctions/ITableFunction.cpp b/src/TableFunctions/ITableFunction.cpp index c854b6b0f9c..137e1dc27fe 100644 --- a/src/TableFunctions/ITableFunction.cpp +++ b/src/TableFunctions/ITableFunction.cpp @@ -5,7 +5,7 @@ #include #include #include -#include + namespace ProfileEvents { diff --git a/src/TableFunctions/TableFunctionsGenerateSeries.cpp b/src/TableFunctions/TableFunctionGenerateSeries.cpp similarity index 65% rename from src/TableFunctions/TableFunctionsGenerateSeries.cpp rename to src/TableFunctions/TableFunctionGenerateSeries.cpp index 3941f1eadb2..88d7b0d1a71 100644 --- a/src/TableFunctions/TableFunctionsGenerateSeries.cpp +++ b/src/TableFunctions/TableFunctionGenerateSeries.cpp @@ -1,13 +1,13 @@ +#include +#include +#include +#include +#include +#include #include #include -#include -#include #include -#include -#include -#include -#include -#include +#include #include "registerTableFunctions.h" @@ -18,6 +18,7 @@ namespace ErrorCodes { extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; extern const int ILLEGAL_TYPE_OF_ARGUMENT; + extern const int INVALID_SETTING_VALUE; } namespace @@ -33,8 +34,14 @@ public: static constexpr auto name = "generate_series"; std::string getName() const override { return name; } bool hasStaticStructure() const override { return true; } + private: - StoragePtr executeImpl(const ASTPtr & ast_function, ContextPtr context, const std::string & table_name, ColumnsDescription cached_columns, bool is_insert_query) const override; + StoragePtr executeImpl( + const ASTPtr & ast_function, + ContextPtr context, + const std::string & table_name, + ColumnsDescription cached_columns, + bool is_insert_query) const override; const char * getStorageTypeName() const override { return "SystemNumbers"; } UInt64 evaluateArgument(ContextPtr context, ASTPtr & argument) const; @@ -48,25 +55,31 @@ ColumnsDescription TableFunctionGenerateSeries::getActualTableStructure(ContextP return ColumnsDescription{{{"generate_series", std::make_shared()}}}; } -StoragePtr TableFunctionGenerateSeries::executeImpl(const ASTPtr & ast_function, ContextPtr context, const std::string & table_name, ColumnsDescription /*cached_columns*/, bool /*is_insert_query*/) const +StoragePtr TableFunctionGenerateSeries::executeImpl( + const ASTPtr & ast_function, + ContextPtr context, + const std::string & table_name, + ColumnsDescription /*cached_columns*/, + bool /*is_insert_query*/) const { if (const auto * function = ast_function->as()) { auto arguments = 
function->arguments->children; if (arguments.size() != 2 && arguments.size() != 3) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Table function '{}' requires 'length' or 'offset, length'.", getName()); + throw Exception( + ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Table function '{}' requires 'length' or 'offset, length'.", getName()); UInt64 start = evaluateArgument(context, arguments[0]); UInt64 stop = evaluateArgument(context, arguments[1]); - UInt64 interval = (arguments.size() == 3) ? evaluateArgument(context, arguments[2]) : UInt64{1}; - if (start > stop) { - auto res = std::make_shared(StorageID(getDatabaseName(), table_name), false, std::string{"generate_series"}, 0); - res->startup(); - return res; - } - - auto res = std::make_shared(StorageID(getDatabaseName(), table_name), false, std::string{"generate_series"}, (stop - start) / interval + 1, start, interval); + UInt64 step = (arguments.size() == 3) ? evaluateArgument(context, arguments[2]) : UInt64{1}; + if (step == UInt64{0}) + throw Exception(ErrorCodes::INVALID_SETTING_VALUE, "Table function '{}' requires step to be a positive number", getName()); + auto res = (start > stop) + ? std::make_shared( + StorageID(getDatabaseName(), table_name), false, std::string{"generate_series"}, 0, 0, 0) + : std::make_shared( + StorageID(getDatabaseName(), table_name), false, std::string{"generate_series"}, (stop - start) + 1, start, step); res->startup(); return res; } @@ -82,8 +95,10 @@ UInt64 TableFunctionGenerateSeries::evaluateArgument(ContextPtr context, ASTPtr Field converted = convertFieldToType(field, DataTypeUInt64()); if (converted.isNull()) - throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "The value {} is not representable as UInt64", - applyVisitor(FieldVisitorToString(), field)); + throw Exception( + ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, + "The value {} is not representable as UInt64", + applyVisitor(FieldVisitorToString(), field)); return converted.safeGet(); } diff --git a/src/TableFunctions/TableFunctionNumbers.cpp b/src/TableFunctions/TableFunctionNumbers.cpp index 71a9ba097c6..bcda8dc6a5e 100644 --- a/src/TableFunctions/TableFunctionNumbers.cpp +++ b/src/TableFunctions/TableFunctionNumbers.cpp @@ -1,13 +1,13 @@ +#include +#include +#include +#include +#include +#include #include #include -#include -#include #include -#include -#include -#include -#include -#include +#include #include "registerTableFunctions.h" @@ -16,8 +16,8 @@ namespace DB namespace ErrorCodes { - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; - extern const int ILLEGAL_TYPE_OF_ARGUMENT; +extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; +extern const int ILLEGAL_TYPE_OF_ARGUMENT; } namespace @@ -34,8 +34,14 @@ public: static constexpr auto name = multithreaded ? 
"numbers_mt" : "numbers"; std::string getName() const override { return name; } bool hasStaticStructure() const override { return true; } + private: - StoragePtr executeImpl(const ASTPtr & ast_function, ContextPtr context, const std::string & table_name, ColumnsDescription cached_columns, bool is_insert_query) const override; + StoragePtr executeImpl( + const ASTPtr & ast_function, + ContextPtr context, + const std::string & table_name, + ColumnsDescription cached_columns, + bool is_insert_query) const override; const char * getStorageTypeName() const override { return "SystemNumbers"; } UInt64 evaluateArgument(ContextPtr context, ASTPtr & argument) const; @@ -51,19 +57,26 @@ ColumnsDescription TableFunctionNumbers::getActualTableStructure( } template -StoragePtr TableFunctionNumbers::executeImpl(const ASTPtr & ast_function, ContextPtr context, const std::string & table_name, ColumnsDescription /*cached_columns*/, bool /*is_insert_query*/) const +StoragePtr TableFunctionNumbers::executeImpl( + const ASTPtr & ast_function, + ContextPtr context, + const std::string & table_name, + ColumnsDescription /*cached_columns*/, + bool /*is_insert_query*/) const { if (const auto * function = ast_function->as()) { auto arguments = function->arguments->children; if (arguments.size() != 1 && arguments.size() != 2) - throw Exception(ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Table function '{}' requires 'length' or 'offset, length'.", getName()); + throw Exception( + ErrorCodes::NUMBER_OF_ARGUMENTS_DOESNT_MATCH, "Table function '{}' requires 'length' or 'offset, length'.", getName()); UInt64 offset = arguments.size() == 2 ? evaluateArgument(context, arguments[0]) : 0; UInt64 length = arguments.size() == 2 ? evaluateArgument(context, arguments[1]) : evaluateArgument(context, arguments[0]); - auto res = std::make_shared(StorageID(getDatabaseName(), table_name), multithreaded, std::string{"number"}, length, offset); + auto res = std::make_shared( + StorageID(getDatabaseName(), table_name), multithreaded, std::string{"number"}, length, offset); res->startup(); return res; } @@ -80,8 +93,10 @@ UInt64 TableFunctionNumbers::evaluateArgument(ContextPtr context, Field converted = convertFieldToType(field, DataTypeUInt64()); if (converted.isNull()) - throw Exception(ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, "The value {} is not representable as UInt64", - applyVisitor(FieldVisitorToString(), field)); + throw Exception( + ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, + "The value {} is not representable as UInt64", + applyVisitor(FieldVisitorToString(), field)); return converted.safeGet(); } diff --git a/tests/queries/0_stateless/02970_generate_series.reference b/tests/queries/0_stateless/02970_generate_series.reference new file mode 100644 index 00000000000..9e6f1db911e --- /dev/null +++ b/tests/queries/0_stateless/02970_generate_series.reference @@ -0,0 +1,28 @@ +0 +1 +4 +8 +500000001 +50000000 +100000001 +0 +10 +13 +16 +19 +7 +17 +27 +37 +47 +57 +67 +77 +17 +22 +27 +32 +37 +42 +47 +52 diff --git a/tests/queries/0_stateless/02970_generate_series.sql b/tests/queries/0_stateless/02970_generate_series.sql new file mode 100644 index 00000000000..045f584a622 --- /dev/null +++ b/tests/queries/0_stateless/02970_generate_series.sql @@ -0,0 +1,14 @@ +SELECT count() FROM generate_series(5, 4); +SELECT count() FROM generate_series(0, 0); +SELECT count() FROM generate_series(10, 20, 3); +SELECT count() FROM generate_series(7, 77, 10); +SELECT count() FROM generate_series(0, 1000000000, 2); +SELECT count() FROM generate_series(0, 
999999999, 20); +SELECT count() FROM generate_series(0, 1000000000, 2) WHERE generate_series % 5 == 0; + +SELECT * FROM generate_series(5, 4); +SELECT * FROM generate_series(0, 0); +SELECT * FROM generate_series(10, 20, 3); +SELECT * FROM generate_series(7, 77, 10); +SELECT * FROM generate_series(7, 52, 5) WHERE generate_series >= 13; + From 145e425ddd5707a5852dd3c6ac2672ccbd68e2bd Mon Sep 17 00:00:00 2001 From: divanik Date: Wed, 7 Feb 2024 15:29:45 +0000 Subject: [PATCH 013/985] Added Documentation --- .../table-functions/generate_series.md | 25 +++++++++ .../QueryPlan/ReadFromSystemNumbersStep.cpp | 53 ------------------- src/Storages/System/StorageSystemNumbers.h | 2 +- 3 files changed, 26 insertions(+), 54 deletions(-) create mode 100644 docs/en/sql-reference/table-functions/generate_series.md diff --git a/docs/en/sql-reference/table-functions/generate_series.md b/docs/en/sql-reference/table-functions/generate_series.md new file mode 100644 index 00000000000..de34e10ac76 --- /dev/null +++ b/docs/en/sql-reference/table-functions/generate_series.md @@ -0,0 +1,25 @@ +--- +slug: /en/sql-reference/table-functions/generate_series +sidebar_position: ? +sidebar_label: generate_series +--- + +# generate_series + +`generate_series(START, STOP)` - Returns a table with the single ‘generate_series’ column (UInt64) that contains integers from start to stop inclusively. + +`generate_series(START, STOP, STEP)` - Returns a table with the single ‘generate_series’ column (UInt64) that contains integers from start to stop inclusively with spacing between values given by STEP. + +The following queries return tables with the same content but different column names: + +``` sql +SELECT * FROM numbers(10, 5); +SELECT * FROM generate_series(10, 14); +``` + +And the following queries return tables with the same content but different column names (but the second option is more efficient): + +``` sql +SELECT * FROM numbers(10, 11) WHERE number % 3 == (10 % 3); +SELECT * FROM generate_series(10, 20, 3) ; +``` \ No newline at end of file diff --git a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp index 4b957778c43..3bb2e0cd69d 100644 --- a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp +++ b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp @@ -98,8 +98,6 @@ std::optional stepped_range_from_range(const Range & r, UInt64 st return std::nullopt; begin += remainder; - // LOG_DEBUG(&Poco::Logger::get("stepped_range_from_range"), "Begin: {}", begin); - // LOG_DEBUG(&Poco::Logger::get("stepped_range_from_range"), "Begin: {}", begin); while ((r.left_included <= r.left.get()) && (begin <= r.left.get() - r.left_included)) { if (std::numeric_limits::max() - step < begin) @@ -107,7 +105,6 @@ std::optional stepped_range_from_range(const Range & r, UInt64 st begin += step; } - // LOG_DEBUG(&Poco::Logger::get("stepped_range_from_range"), "Begin: {}", begin); if ((begin >= r.right_included) && (begin - r.right_included >= r.right.get())) return std::nullopt; UInt64 right_edge_included = r.right.get() - (1 - r.right_included); @@ -217,9 +214,6 @@ protected: ranges_state->pos = end; - LOG_DEBUG(&Poco::Logger::get("Range borders"), "Begin: {} {}", start.offset_in_ranges, static_cast(start.offset_in_range)); - LOG_DEBUG(&Poco::Logger::get("Range borders"), "End: {} {}", end.offset_in_ranges, static_cast(end.offset_in_range)); - return size; } @@ -258,12 +252,6 @@ protected: ? 
end.offset_in_range - cursor.offset_in_range : static_cast(last_value(range) - first_value(range)) / range.step + 1 - cursor.offset_in_range; - LOG_DEBUG( - &Poco::Logger::get("Generate"), - "Can Provide: {}, Block size: {}", - static_cast(can_provide), - static_cast(block_size)); - /// set value to block auto set_value = [&pos, this](UInt128 & start_value, UInt128 & end_value) { @@ -280,8 +268,6 @@ protected: auto start_value_64 = static_cast(start_value); auto end_value_64 = static_cast(end_value); auto size = (end_value_64 - start_value_64) / this->step; - LOG_DEBUG( - &Poco::Logger::get("Iota"), "Size: {}, Step: {}, Start: {}", static_cast(size), this->step, start_value_64); iota_with_step(pos, static_cast(size), start_value_64, step); pos += size; } @@ -443,13 +429,6 @@ Pipe ReadFromSystemNumbersStep::makePipe() { auto & numbers_storage = storage->as(); - LOG_DEBUG( - &Poco::Logger::get("Parameters"), - "Parameters: Limit: {}, Offset: {} Step: {}", - numbers_storage.limit.value(), - numbers_storage.offset, - numbers_storage.step); - if (!numbers_storage.multithreaded) num_streams = 1; @@ -468,7 +447,6 @@ Pipe ReadFromSystemNumbersStep::makePipe() if (condition.extractPlainRanges(ranges)) { - LOG_DEBUG(&Poco::Logger::get("My logger"), "Use optimization"); /// Intersect ranges with table range std::optional table_range; std::optional overflowed_table_range; @@ -493,36 +471,11 @@ Pipe ReadFromSystemNumbersStep::makePipe() { table_range.emplace(FieldRef(numbers_storage.offset), true, FieldRef(std::numeric_limits::max()), true); } - LOG_DEBUG(&Poco::Logger::get("My logger"), "Found table ranges"); RangesWithStep intersected_ranges; for (auto & r : ranges) { auto intersected_range = table_range->intersectWith(r); - if (intersected_range.has_value()) - { - LOG_DEBUG( - &Poco::Logger::get("Ranges"), - "Ranges: {} {} {} {}", - intersected_range->left.get(), - intersected_range->right.get(), - intersected_range->left_included, - intersected_range->right_included); - auto range_with_step = stepped_range_from_range( - intersected_range.value(), numbers_storage.step, numbers_storage.offset % numbers_storage.step); - if (range_with_step.has_value()) - { - LOG_DEBUG( - &Poco::Logger::get("Ranges With Step"), - "Ranges: {} {} {} {} {}", - range_with_step->range.left.get(), - range_with_step->range.right.get(), - range_with_step->range.left_included, - range_with_step->range.right_included, - range_with_step->step); - intersected_ranges.push_back(*range_with_step); - } - } } @@ -546,11 +499,6 @@ Pipe ReadFromSystemNumbersStep::makePipe() } } - // for (const auto& range : intersected_ranges) - // { - // LOG_DEBUG(&Poco::Logger::get("Ranges with step"), "Left: {}; Right {}, LI: {}, RI: {}, Step: {}", range.range.left.get(), range.range.right.get(), range.range.left_included, range.range.right_included, range.step); - // // std::cout << - // } /// ranges is blank, return a source who has no data if (intersected_ranges.empty()) @@ -565,7 +513,6 @@ Pipe ReadFromSystemNumbersStep::makePipe() if (!intersected_ranges.rbegin()->range.right.isPositiveInfinity() || should_pushdown_limit) { UInt128 total_size = sizeOfRanges(intersected_ranges); - LOG_DEBUG(&Poco::Logger::get("Total_Size"), "Total Size: {}", static_cast(total_size)); UInt128 query_limit = limit_length + limit_offset; /// limit total_size by query_limit diff --git a/src/Storages/System/StorageSystemNumbers.h b/src/Storages/System/StorageSystemNumbers.h index 9663ee25251..298721984b8 100644 --- a/src/Storages/System/StorageSystemNumbers.h +++ 
b/src/Storages/System/StorageSystemNumbers.h @@ -43,7 +43,7 @@ private: bool multithreaded; std::optional limit; - UInt64 offset;` + UInt64 offset; std::string column_name; UInt64 step; }; From 03aaedace439f5db6d9a6aaf91a1b2f978b0f6a9 Mon Sep 17 00:00:00 2001 From: divanik Date: Fri, 9 Feb 2024 12:05:01 +0000 Subject: [PATCH 014/985] Fix bug --- .../QueryPlan/ReadFromSystemNumbersStep.cpp | 11 +++++++++++ 1 file changed, 11 insertions(+) diff --git a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp index 3bb2e0cd69d..bc14547889b 100644 --- a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp +++ b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp @@ -435,6 +435,8 @@ Pipe ReadFromSystemNumbersStep::makePipe() Pipe pipe; Ranges ranges; + // LOG_DEBUG(&Poco::Logger::get("parameters"), "Parameters: {} {} {}", numbers_storage.step, numbers_storage.limit.value(), numbers_storage.offset); + if (numbers_storage.limit.has_value() && (numbers_storage.limit.value() == 0)) { pipe.addSource(std::make_shared(NumbersSource::createHeader(numbers_storage.column_name))); @@ -476,6 +478,15 @@ Pipe ReadFromSystemNumbersStep::makePipe() for (auto & r : ranges) { auto intersected_range = table_range->intersectWith(r); + if (intersected_range.has_value()) + { + auto range_with_step = stepped_range_from_range( + intersected_range.value(), numbers_storage.step, numbers_storage.offset % numbers_storage.step); + if (range_with_step.has_value()) + { + intersected_ranges.push_back(*range_with_step); + } + } } From 1b2f23247b7f115ba92b9908d224d4e78e8649f4 Mon Sep 17 00:00:00 2001 From: divanik Date: Fri, 9 Feb 2024 12:28:54 +0000 Subject: [PATCH 015/985] Change documentation --- docs/en/sql-reference/table-functions/generate_series.md | 2 +- src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp | 2 -- 2 files changed, 1 insertion(+), 3 deletions(-) diff --git a/docs/en/sql-reference/table-functions/generate_series.md b/docs/en/sql-reference/table-functions/generate_series.md index de34e10ac76..c5d29369627 100644 --- a/docs/en/sql-reference/table-functions/generate_series.md +++ b/docs/en/sql-reference/table-functions/generate_series.md @@ -1,6 +1,6 @@ --- slug: /en/sql-reference/table-functions/generate_series -sidebar_position: ? 
+sidebar_position: 146 sidebar_label: generate_series --- diff --git a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp index bc14547889b..ab2f726aeb5 100644 --- a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp +++ b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp @@ -483,9 +483,7 @@ Pipe ReadFromSystemNumbersStep::makePipe() auto range_with_step = stepped_range_from_range( intersected_range.value(), numbers_storage.step, numbers_storage.offset % numbers_storage.step); if (range_with_step.has_value()) - { intersected_ranges.push_back(*range_with_step); - } } } From 79f91003538a71014eb035dca024285f2fbba7d5 Mon Sep 17 00:00:00 2001 From: divanik Date: Fri, 9 Feb 2024 14:17:25 +0000 Subject: [PATCH 016/985] To pull --- src/TableFunctions/TableFunctionGenerateSeries.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/TableFunctions/TableFunctionGenerateSeries.cpp b/src/TableFunctions/TableFunctionGenerateSeries.cpp index 88d7b0d1a71..65c4c4915c2 100644 --- a/src/TableFunctions/TableFunctionGenerateSeries.cpp +++ b/src/TableFunctions/TableFunctionGenerateSeries.cpp @@ -77,7 +77,7 @@ StoragePtr TableFunctionGenerateSeries::executeImpl( throw Exception(ErrorCodes::INVALID_SETTING_VALUE, "Table function '{}' requires step to be a positive number", getName()); auto res = (start > stop) ? std::make_shared( - StorageID(getDatabaseName(), table_name), false, std::string{"generate_series"}, 0, 0, 0) + StorageID(getDatabaseName(), table_name), false, std::string{"generate_series"}, 0, 0, 1) : std::make_shared( StorageID(getDatabaseName(), table_name), false, std::string{"generate_series"}, (stop - start) + 1, start, step); res->startup(); From f7dbcdd7e7e00d4fb6d30a02ebcb4a3befcd3190 Mon Sep 17 00:00:00 2001 From: divanik Date: Fri, 9 Feb 2024 18:12:24 +0000 Subject: [PATCH 017/985] Made refactoring --- .../QueryPlan/ReadFromSystemNumbersStep.cpp | 41 ++++++++++++------- src/Storages/System/StorageSystemNumbers.h | 28 +++++++++++++ 2 files changed, 54 insertions(+), 15 deletions(-) diff --git a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp index 3a905a56aa1..2488fa37643 100644 --- a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp +++ b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp @@ -9,10 +9,12 @@ #include #include #include +#include #include #include #include +#include "base/types.h" namespace DB { @@ -28,13 +30,13 @@ namespace class NumbersSource : public ISource { public: - NumbersSource(UInt64 block_size_, UInt64 offset_, UInt64 step_, const std::string & column_name, UInt64 inner_step_) + NumbersSource(UInt64 block_size_, UInt64 offset_, UInt64 chunk_step_, const std::string & column_name, UInt64 step_, UInt64 remainder_) : ISource(createHeader(column_name)) , block_size(block_size_) , next(offset_) + , chunk_step(chunk_step_) , step(step_) - , inner_step(inner_step_) - , inner_remainder(offset_ % inner_step_) + , remainder(remainder_) { } String getName() const override { return "Numbers"; } @@ -48,25 +50,33 @@ protected: Chunk generate() override { UInt64 curr = next; /// The local variable for some reason works faster (>20%) than member of class. 
- UInt64 first_element = (curr / inner_step) * inner_step + inner_remainder; - if (first_element < curr) - first_element += inner_step; - UInt64 filtered_block_size = 0; + UInt64 first_element = (curr / step) * step; + if (first_element > std::numeric_limits::max() - remainder) { + auto column = ColumnUInt64::create(0); + return {Columns{std::move(column)}, 0}; + } + first_element += remainder; + if (first_element < curr) { + if (first_element > std::numeric_limits::max() - step) { + auto column = ColumnUInt64::create(0); + return {Columns{std::move(column)}, 0}; + } + first_element += step; + } if (first_element - curr >= block_size) { auto column = ColumnUInt64::create(0); - return {Columns{std::move(column)}, filtered_block_size}; + return {Columns{std::move(column)}, 0}; } - if (first_element - curr < block_size) - filtered_block_size = (block_size - (first_element - curr) - 1) / inner_step + 1; + UInt64 filtered_block_size = (block_size - (first_element - curr) - 1) / step + 1; auto column = ColumnUInt64::create(filtered_block_size); ColumnUInt64::Container & vec = column->getData(); UInt64 * pos = vec.data(); /// This also accelerates the code. UInt64 * end = &vec[filtered_block_size]; - iota_with_step(pos, static_cast(end - pos), first_element, inner_step); + iota_with_step(pos, static_cast(end - pos), first_element, step); - next += step; + next += chunk_step; progress(column->size(), column->byteSize()); @@ -76,9 +86,9 @@ protected: private: UInt64 block_size; UInt64 next; + UInt64 chunk_step; UInt64 step; - UInt64 inner_step; - UInt64 inner_remainder; + UInt64 remainder; }; struct RangeWithStep @@ -565,7 +575,8 @@ Pipe ReadFromSystemNumbersStep::makePipe() numbers_storage.offset + i * max_block_size, num_streams * max_block_size, numbers_storage.column_name, - numbers_storage.step); + numbers_storage.step, + numbers_storage.offset % numbers_storage.step); if (numbers_storage.limit && i == 0) { diff --git a/src/Storages/System/StorageSystemNumbers.h b/src/Storages/System/StorageSystemNumbers.h index 298721984b8..c698bae4393 100644 --- a/src/Storages/System/StorageSystemNumbers.h +++ b/src/Storages/System/StorageSystemNumbers.h @@ -10,6 +10,34 @@ namespace DB class Context; +/** Implements a table engine for the system table "numbers". + * The table contains the only column number UInt64. + * From this table, you can read all natural numbers, starting from 0 (to 2^64 - 1, and then again). + * + * You could also specify a limit (how many numbers to give). + * + * How to generate numbers? + * + * 1. First try a smart fashion: + * + * In this fashion we try to push filters and limit down to scanning. + * Firstly extract plain ranges(no overlapping and ordered) by filter expressions. + * + * For example: + * where (numbers > 1 and numbers < 3) or (numbers in (4, 6)) or (numbers > 7 and numbers < 9) + * + * We will get ranges + * (1, 3), [4, 4], [6, 6], (7, 9) + * + * Then split the ranges evenly to one or multi-streams. With this way we will get result without large scanning. + * + * 2. If fail to extract plain ranges, fall back to ordinary scanning. + * + * If multithreaded is specified, numbers will be generated in several streams + * (and result could be out of order). If both multithreaded and limit are specified, + * the table could give you not exactly 1..limit range, but some arbitrary 'limit' numbers. 
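+ *
+ * For example, generate_series(10, 20, 3) is backed by this storage with offset = 10, step = 3 and limit = 11,
+ * and yields 10, 13, 16, 19 (see tests/queries/0_stateless/02970_generate_series.sql).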
+ */ + class StorageSystemNumbers final : public IStorage { public: From 696609e7d562d15cfc7a6ffa776785444a97c2e7 Mon Sep 17 00:00:00 2001 From: divanik Date: Sat, 10 Feb 2024 19:59:57 +0000 Subject: [PATCH 018/985] Kek --- .../QueryPlan/ReadFromSystemNumbersStep.cpp | 42 ++++++++++++++++--- 1 file changed, 36 insertions(+), 6 deletions(-) diff --git a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp index 2488fa37643..dc6aebc69c1 100644 --- a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp +++ b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp @@ -14,6 +14,7 @@ #include #include +#include "Core/Types.h" #include "base/types.h" namespace DB @@ -51,13 +52,16 @@ protected: { UInt64 curr = next; /// The local variable for some reason works faster (>20%) than member of class. UInt64 first_element = (curr / step) * step; - if (first_element > std::numeric_limits::max() - remainder) { + if (first_element > std::numeric_limits::max() - remainder) + { auto column = ColumnUInt64::create(0); return {Columns{std::move(column)}, 0}; } first_element += remainder; - if (first_element < curr) { - if (first_element > std::numeric_limits::max() - step) { + if (first_element < curr) + { + if (first_element > std::numeric_limits::max() - step) + { auto column = ColumnUInt64::create(0); return {Columns{std::move(column)}, 0}; } @@ -101,6 +105,8 @@ using RangesWithStep = std::vector; std::optional stepped_range_from_range(const Range & r, UInt64 step, UInt64 remainder) { + // LOG_DEBUG(&Poco::Logger::get("Stepped from range"), + // "stepped from range"); if ((r.right.get() == 0) && (!r.right_included)) return std::nullopt; UInt64 begin = (r.left.get() / step) * step; @@ -126,7 +132,11 @@ std::optional stepped_range_from_range(const Range & r, UInt64 st if (r.range.right.isPositiveInfinity()) return static_cast(std::numeric_limits::max() - r.range.left.get()) / r.step + r.range.left_included; - return static_cast(r.range.right.get() - r.range.left.get()) / r.step + 1; + UInt128 size = static_cast(r.range.right.get() - r.range.left.get()) / r.step; + if (r.range.right_included && (r.range.right.get() % r.step == 0)) { + ++size; + } + return size; }; [[maybe_unused]] auto sizeOfRanges(const RangesWithStep & rs) @@ -173,6 +183,17 @@ public: , base_block_size(base_block_size_) , step(step_) { + // for (const auto& range_with_step : ranges_) { + // // LOG_DEBUG(&Poco::Logger::get("Ranges With Step"), + // // "Ranges: {} {} {} {} {}", + // // range_with_step.range.left.get(), + // // range_with_step.range.right.get(), + // // range_with_step.range.left_included, + // // range_with_step.range.right_included, + // // range_with_step.step); + // // LOG_DEBUG(&Poco::Logger::get("Ranges With Step"), + // // "Step: {}", step); + // } } String getName() const override { return "NumbersRange"; } @@ -241,6 +262,8 @@ protected: RangesPos start, end; auto block_size = findRanges(start, end, base_block_size); + // LOG_DEBUG(&Poco::Logger::get("Found range"), "Evth: {} {} {} {} {} {}", start.offset_in_ranges, static_cast(start.offset_in_range), end.offset_in_ranges, static_cast(end.offset_in_range), base_block_size, block_size); + if (!block_size) return {}; @@ -256,6 +279,11 @@ protected: while (block_size - provided != 0) { UInt64 need = block_size - provided; + // LOG_DEBUG(&Poco::Logger::get("Indices:"), + // "Indices: {} {}, provided: {}", + // ranges.size(), + // cursor.offset_in_ranges, + // provided); auto & range = 
ranges[cursor.offset_in_ranges]; UInt128 can_provide = cursor.offset_in_ranges == end.offset_in_ranges @@ -445,13 +473,15 @@ Pipe ReadFromSystemNumbersStep::makePipe() Pipe pipe; Ranges ranges; - // LOG_DEBUG(&Poco::Logger::get("parameters"), "Parameters: {} {} {}", numbers_storage.step, numbers_storage.limit.value(), numbers_storage.offset); + + // LOG_DEBUG(&Poco::Logger::get("parameters"), "Parameters: {} {} {} {}", numbers_storage.step, numbers_storage.offset, numbers_storage.limit.has_value(), numbers_storage.limit.has_value() ? numbers_storage.limit.value() : UInt64{0}); if (numbers_storage.limit.has_value() && (numbers_storage.limit.value() == 0)) { pipe.addSource(std::make_shared(NumbersSource::createHeader(numbers_storage.column_name))); return pipe; } + chassert(numbers_storage.step != UInt64{0}); /// Build rpn of query filters KeyCondition condition(buildFilterDAG(), context, column_names, key_expression); @@ -575,7 +605,7 @@ Pipe ReadFromSystemNumbersStep::makePipe() numbers_storage.offset + i * max_block_size, num_streams * max_block_size, numbers_storage.column_name, - numbers_storage.step, + numbers_storage.step, numbers_storage.offset % numbers_storage.step); if (numbers_storage.limit && i == 0) From 3ec9f3c4c89dec2f1971979d7d3ae406c1ecd938 Mon Sep 17 00:00:00 2001 From: divanik Date: Sat, 10 Feb 2024 20:06:52 +0000 Subject: [PATCH 019/985] Check foormattign --- src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp | 9 ++++----- 1 file changed, 4 insertions(+), 5 deletions(-) diff --git a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp index dc6aebc69c1..1e6b539ee2e 100644 --- a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp +++ b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp @@ -52,15 +52,15 @@ protected: { UInt64 curr = next; /// The local variable for some reason works faster (>20%) than member of class. 
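/// Illustrative arithmetic for the lines below: with step = 10 and remainder = 7, a chunk starting at curr = 23
/// gives first_element = (23 / 10) * 10 + 7 = 27, i.e. the first number >= curr that is congruent to the requested offset modulo step.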
UInt64 first_element = (curr / step) * step; - if (first_element > std::numeric_limits::max() - remainder) + if (first_element > std::numeric_limits::max() - remainder) { auto column = ColumnUInt64::create(0); return {Columns{std::move(column)}, 0}; } first_element += remainder; - if (first_element < curr) + if (first_element < curr) { - if (first_element > std::numeric_limits::max() - step) + if (first_element > std::numeric_limits::max() - step) { auto column = ColumnUInt64::create(0); return {Columns{std::move(column)}, 0}; @@ -133,9 +133,8 @@ std::optional stepped_range_from_range(const Range & r, UInt64 st return static_cast(std::numeric_limits::max() - r.range.left.get()) / r.step + r.range.left_included; UInt128 size = static_cast(r.range.right.get() - r.range.left.get()) / r.step; - if (r.range.right_included && (r.range.right.get() % r.step == 0)) { + if (r.range.right_included && (r.range.right.get() % r.step == 0)) ++size; - } return size; }; From d0456980991c45935fd316ca7dc2bd61cf45e5b9 Mon Sep 17 00:00:00 2001 From: divanik Date: Sat, 10 Feb 2024 23:04:52 +0000 Subject: [PATCH 020/985] It seems to work --- .../QueryPlan/ReadFromSystemNumbersStep.cpp | 31 ++++++------------- ...ble_functions_must_be_documented.reference | 1 + 2 files changed, 11 insertions(+), 21 deletions(-) diff --git a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp index 1e6b539ee2e..2217e426b02 100644 --- a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp +++ b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp @@ -97,7 +97,8 @@ private: struct RangeWithStep { - Range range; + UInt64 left; + UInt64 right; UInt64 step; }; @@ -124,18 +125,12 @@ std::optional stepped_range_from_range(const Range & r, UInt64 st if ((begin >= r.right_included) && (begin - r.right_included >= r.right.get())) return std::nullopt; UInt64 right_edge_included = r.right.get() - (1 - r.right_included); - return std::optional{RangeWithStep{Range(begin, true, right_edge_included, true), step}}; + return std::optional{RangeWithStep{begin, right_edge_included, step}}; } [[maybe_unused]] UInt128 sizeOfRange(const RangeWithStep & r) { - if (r.range.right.isPositiveInfinity()) - return static_cast(std::numeric_limits::max() - r.range.left.get()) / r.step + r.range.left_included; - - UInt128 size = static_cast(r.range.right.get() - r.range.left.get()) / r.step; - if (r.range.right_included && (r.range.right.get() % r.step == 0)) - ++size; - return size; + return static_cast(r.right - r.left) / r.step + 1; }; [[maybe_unused]] auto sizeOfRanges(const RangesWithStep & rs) @@ -252,10 +247,6 @@ protected: if (ranges.empty()) return {}; - auto first_value = [](const RangeWithStep & r) { return r.range.left.get() + (r.range.left_included ? 0 : 1); }; - - auto last_value = [](const RangeWithStep & r) { return r.range.right.get() - (r.range.right_included ? 0 : 1); }; - /// Find the data range. /// If data left is small, shrink block size. RangesPos start, end; @@ -287,7 +278,7 @@ protected: UInt128 can_provide = cursor.offset_in_ranges == end.offset_in_ranges ? 
end.offset_in_range - cursor.offset_in_range - : static_cast(last_value(range) - first_value(range)) / range.step + 1 - cursor.offset_in_range; + : static_cast(range.right - range.left) / range.step + 1 - cursor.offset_in_range; /// set value to block auto set_value = [&pos, this](UInt128 & start_value, UInt128 & end_value) @@ -312,7 +303,7 @@ protected: if (can_provide > need) { - UInt64 start_value = first_value(range) + cursor.offset_in_range * step; + UInt64 start_value = range.left + cursor.offset_in_range * step; /// end_value will never overflow iota_with_step(pos, static_cast(need), start_value, step); pos += need; @@ -323,7 +314,7 @@ protected: else if (can_provide == need) { /// to avoid UInt64 overflow - UInt128 start_value = static_cast(first_value(range)) + cursor.offset_in_range * step; + UInt128 start_value = static_cast(range.left) + cursor.offset_in_range * step; UInt128 end_value = start_value + need * step; set_value(start_value, end_value); @@ -334,7 +325,7 @@ protected: else { /// to avoid UInt64 overflow - UInt128 start_value = static_cast(first_value(range)) + cursor.offset_in_range * step; + UInt128 start_value = static_cast(range.left) + cursor.offset_in_range * step; UInt128 end_value = start_value + can_provide * step; set_value(start_value, end_value); @@ -400,9 +391,7 @@ namespace else { auto & range = ranges[i]; - UInt64 right = range.range.left.get() + static_cast(size); - range.range.right = Field(right); - range.range.right_included = !range.range.left_included; + range.right = range.left + static_cast(size) * range.step - 1; last_range_idx = i; break; } @@ -558,7 +547,7 @@ Pipe ReadFromSystemNumbersStep::makePipe() const auto & limit_offset = limit_length_and_offset.second; /// If intersected ranges is limited or we can pushdown limit. - if (!intersected_ranges.rbegin()->range.right.isPositiveInfinity() || should_pushdown_limit) + if (should_pushdown_limit) { UInt128 total_size = sizeOfRanges(intersected_ranges); UInt128 query_limit = limit_length + limit_offset; diff --git a/tests/queries/0_stateless/02414_all_new_table_functions_must_be_documented.reference b/tests/queries/0_stateless/02414_all_new_table_functions_must_be_documented.reference index e4040a2d371..1e4f21a6722 100644 --- a/tests/queries/0_stateless/02414_all_new_table_functions_must_be_documented.reference +++ b/tests/queries/0_stateless/02414_all_new_table_functions_must_be_documented.reference @@ -4,6 +4,7 @@ dictionary executable file generateRandom +generate_series input jdbc merge From 789d3c699c77d7a39f42281d9dc0c61010471242 Mon Sep 17 00:00:00 2001 From: divanik Date: Sat, 10 Feb 2024 23:49:58 +0000 Subject: [PATCH 021/985] Remove bug for mt --- .../QueryPlan/ReadFromSystemNumbersStep.cpp | 65 +++++++++---------- 1 file changed, 31 insertions(+), 34 deletions(-) diff --git a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp index 2217e426b02..3656a6d31ee 100644 --- a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp +++ b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp @@ -547,42 +547,39 @@ Pipe ReadFromSystemNumbersStep::makePipe() const auto & limit_offset = limit_length_and_offset.second; /// If intersected ranges is limited or we can pushdown limit. 
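/// Illustrative example: for SELECT * FROM numbers(1000000000) LIMIT 10 the limit can be pushed down,
/// so total_size is capped at limit_length + limit_offset and only a handful of rows are generated instead of the whole range.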
- if (should_pushdown_limit) + UInt128 total_size = sizeOfRanges(intersected_ranges); + UInt128 query_limit = limit_length + limit_offset; + + /// limit total_size by query_limit + if (should_pushdown_limit && query_limit < total_size) { - UInt128 total_size = sizeOfRanges(intersected_ranges); - UInt128 query_limit = limit_length + limit_offset; - - /// limit total_size by query_limit - if (should_pushdown_limit && query_limit < total_size) - { - total_size = query_limit; - /// We should shrink intersected_ranges for case: - /// intersected_ranges: [1, 4], [7, 100]; query_limit: 2 - shrinkRanges(intersected_ranges, total_size); - } - - checkLimits(size_t(total_size)); - - if (total_size / max_block_size < num_streams) - num_streams = static_cast(total_size / max_block_size); - - if (num_streams == 0) - num_streams = 1; - - /// Ranges state, all streams will share the state. - auto ranges_state = std::make_shared(); - for (size_t i = 0; i < num_streams; ++i) - { - auto source = std::make_shared( - intersected_ranges, ranges_state, max_block_size, numbers_storage.step, numbers_storage.column_name); - - if (i == 0) - source->addTotalRowsApprox(total_size); - - pipe.addSource(std::move(source)); - } - return pipe; + total_size = query_limit; + /// We should shrink intersected_ranges for case: + /// intersected_ranges: [1, 4], [7, 100]; query_limit: 2 + shrinkRanges(intersected_ranges, total_size); } + + checkLimits(size_t(total_size)); + + if (total_size / max_block_size < num_streams) + num_streams = static_cast(total_size / max_block_size); + + if (num_streams == 0) + num_streams = 1; + + /// Ranges state, all streams will share the state. + auto ranges_state = std::make_shared(); + for (size_t i = 0; i < num_streams; ++i) + { + auto source = std::make_shared( + intersected_ranges, ranges_state, max_block_size, numbers_storage.step, numbers_storage.column_name); + + if (i == 0) + source->addTotalRowsApprox(total_size); + + pipe.addSource(std::move(source)); + } + return pipe; } /// Fall back to NumbersSource From 0f84f68da77663e2adcce800cceefff5ab019b58 Mon Sep 17 00:00:00 2001 From: divanik Date: Tue, 13 Feb 2024 09:59:39 +0000 Subject: [PATCH 022/985] Simplified code --- src/Common/iota.cpp | 2 +- src/Common/iota.h | 2 +- .../QueryPlan/ReadFromSystemNumbersStep.cpp | 65 +++++-------------- .../02970_generate_series.reference | 1 - .../0_stateless/02970_generate_series.sql | 1 - 5 files changed, 20 insertions(+), 51 deletions(-) diff --git a/src/Common/iota.cpp b/src/Common/iota.cpp index 532c4bde76d..86c9e04bb06 100644 --- a/src/Common/iota.cpp +++ b/src/Common/iota.cpp @@ -60,6 +60,6 @@ template void iota_with_step(UInt8 * begin, size_t count, UInt8 first_value, UIn template void iota_with_step(UInt32 * begin, size_t count, UInt32 first_value, UInt32 step); template void iota_with_step(UInt64 * begin, size_t count, UInt64 first_value, UInt64 step); #if defined(OS_DARWIN) -extern template void iota_with_step(size_t * begin, size_t count, size_t first_value, size_t step); +template void iota_with_step(size_t * begin, size_t count, size_t first_value, size_t step); #endif } diff --git a/src/Common/iota.h b/src/Common/iota.h index f40cde9d5db..8fa18be9769 100644 --- a/src/Common/iota.h +++ b/src/Common/iota.h @@ -38,6 +38,6 @@ extern template void iota_with_step(UInt8 * begin, size_t count, UInt8 first_val extern template void iota_with_step(UInt32 * begin, size_t count, UInt32 first_value, UInt32 step); extern template void iota_with_step(UInt64 * begin, size_t count, UInt64 first_value, 
UInt64 step); #if defined(OS_DARWIN) -extern template void iota(size_t * begin, size_t count, size_t first_value, size_t step); +extern template void iota_with_step(size_t * begin, size_t count, size_t first_value, size_t step); #endif } diff --git a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp index 3656a6d31ee..d69e2b6ca5a 100644 --- a/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp +++ b/src/Processors/QueryPlan/ReadFromSystemNumbersStep.cpp @@ -15,6 +15,7 @@ #include #include "Core/Types.h" +#include "base/Decimal_fwd.h" #include "base/types.h" namespace DB @@ -31,13 +32,12 @@ namespace class NumbersSource : public ISource { public: - NumbersSource(UInt64 block_size_, UInt64 offset_, UInt64 chunk_step_, const std::string & column_name, UInt64 step_, UInt64 remainder_) + NumbersSource(UInt64 block_size_, UInt64 offset_, UInt64 chunk_step_, const std::string & column_name, UInt64 step_) : ISource(createHeader(column_name)) , block_size(block_size_) , next(offset_) , chunk_step(chunk_step_) , step(step_) - , remainder(remainder_) { } String getName() const override { return "Numbers"; } @@ -50,41 +50,19 @@ public: protected: Chunk generate() override { - UInt64 curr = next; /// The local variable for some reason works faster (>20%) than member of class. - UInt64 first_element = (curr / step) * step; - if (first_element > std::numeric_limits::max() - remainder) - { - auto column = ColumnUInt64::create(0); - return {Columns{std::move(column)}, 0}; - } - first_element += remainder; - if (first_element < curr) - { - if (first_element > std::numeric_limits::max() - step) - { - auto column = ColumnUInt64::create(0); - return {Columns{std::move(column)}, 0}; - } - first_element += step; - } - if (first_element - curr >= block_size) - { - auto column = ColumnUInt64::create(0); - return {Columns{std::move(column)}, 0}; - } - UInt64 filtered_block_size = (block_size - (first_element - curr) - 1) / step + 1; - - auto column = ColumnUInt64::create(filtered_block_size); + auto column = ColumnUInt64::create(block_size); ColumnUInt64::Container & vec = column->getData(); + + UInt64 curr = next; /// The local variable for some reason works faster (>20%) than member of class. UInt64 * pos = vec.data(); /// This also accelerates the code. 
- UInt64 * end = &vec[filtered_block_size]; - iota_with_step(pos, static_cast(end - pos), first_element, step); + UInt64 * end = &vec[block_size]; + iota_with_step(pos, static_cast(end - pos), curr, step); next += chunk_step; progress(column->size(), column->byteSize()); - return {Columns{std::move(column)}, filtered_block_size}; + return {Columns{std::move(column)}, block_size}; } private: @@ -92,14 +70,13 @@ private: UInt64 next; UInt64 chunk_step; UInt64 step; - UInt64 remainder; }; struct RangeWithStep { UInt64 left; - UInt64 right; UInt64 step; + UInt128 size; }; using RangesWithStep = std::vector; @@ -125,21 +102,16 @@ std::optional stepped_range_from_range(const Range & r, UInt64 st if ((begin >= r.right_included) && (begin - r.right_included >= r.right.get())) return std::nullopt; UInt64 right_edge_included = r.right.get() - (1 - r.right_included); - return std::optional{RangeWithStep{begin, right_edge_included, step}}; + return std::optional{RangeWithStep{begin, step, static_cast(right_edge_included - begin) / step + 1}}; } -[[maybe_unused]] UInt128 sizeOfRange(const RangeWithStep & r) -{ - return static_cast(r.right - r.left) / r.step + 1; -}; - [[maybe_unused]] auto sizeOfRanges(const RangesWithStep & rs) { UInt128 total_size{}; for (const RangeWithStep & r : rs) { /// total_size will never overflow - total_size += sizeOfRange(r); + total_size += r.size; } return total_size; }; @@ -211,7 +183,7 @@ protected: while (need != 0) { UInt128 can_provide = end.offset_in_ranges == ranges.size() ? static_cast(0) - : sizeOfRange(ranges[end.offset_in_ranges]) - end.offset_in_range; + : ranges[end.offset_in_ranges].size - end.offset_in_range; if (can_provide == 0) break; @@ -278,7 +250,7 @@ protected: UInt128 can_provide = cursor.offset_in_ranges == end.offset_in_ranges ? 
end.offset_in_range - cursor.offset_in_range - : static_cast(range.right - range.left) / range.step + 1 - cursor.offset_in_range; + : range.size - cursor.offset_in_range; /// set value to block auto set_value = [&pos, this](UInt128 & start_value, UInt128 & end_value) @@ -377,7 +349,7 @@ namespace size_t last_range_idx = 0; for (size_t i = 0; i < ranges.size(); i++) { - auto range_size = sizeOfRange(ranges[i]); + auto range_size = ranges[i].size; if (range_size < size) { size -= static_cast(range_size); @@ -391,7 +363,7 @@ namespace else { auto & range = ranges[i]; - range.right = range.left + static_cast(size) * range.step - 1; + range.size = static_cast(size); last_range_idx = i; break; } @@ -587,11 +559,10 @@ Pipe ReadFromSystemNumbersStep::makePipe() { auto source = std::make_shared( max_block_size, - numbers_storage.offset + i * max_block_size, - num_streams * max_block_size, + numbers_storage.offset + i * max_block_size * numbers_storage.step, + num_streams * max_block_size * numbers_storage.step, numbers_storage.column_name, - numbers_storage.step, - numbers_storage.offset % numbers_storage.step); + numbers_storage.step); if (numbers_storage.limit && i == 0) { diff --git a/tests/queries/0_stateless/02970_generate_series.reference b/tests/queries/0_stateless/02970_generate_series.reference index 9e6f1db911e..4e4f556a39b 100644 --- a/tests/queries/0_stateless/02970_generate_series.reference +++ b/tests/queries/0_stateless/02970_generate_series.reference @@ -4,7 +4,6 @@ 8 500000001 50000000 -100000001 0 10 13 diff --git a/tests/queries/0_stateless/02970_generate_series.sql b/tests/queries/0_stateless/02970_generate_series.sql index 045f584a622..a7f89e1bd3f 100644 --- a/tests/queries/0_stateless/02970_generate_series.sql +++ b/tests/queries/0_stateless/02970_generate_series.sql @@ -4,7 +4,6 @@ SELECT count() FROM generate_series(10, 20, 3); SELECT count() FROM generate_series(7, 77, 10); SELECT count() FROM generate_series(0, 1000000000, 2); SELECT count() FROM generate_series(0, 999999999, 20); -SELECT count() FROM generate_series(0, 1000000000, 2) WHERE generate_series % 5 == 0; SELECT * FROM generate_series(5, 4); SELECT * FROM generate_series(0, 0); From d12ecdc5f06689d6259e2ef082a916f8b2f1836f Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Tue, 13 Feb 2024 12:35:17 +0100 Subject: [PATCH 023/985] Asynchronous WriteBuffer for AzureBlobStorage --- src/Backups/BackupIO_AzureBlobStorage.cpp | 3 +- src/Core/Settings.h | 3 +- .../IO/WriteBufferFromAzureBlobStorage.cpp | 116 +++++++++++------- .../IO/WriteBufferFromAzureBlobStorage.h | 22 +++- .../AzureBlobStorage/AzureBlobStorageAuth.cpp | 3 +- .../AzureBlobStorage/AzureObjectStorage.cpp | 3 +- .../AzureBlobStorage/AzureObjectStorage.h | 5 +- src/IO/WriteBufferFromS3.cpp | 2 +- src/IO/WriteBufferFromS3.h | 5 +- src/IO/WriteBufferFromS3TaskTracker.cpp | 21 ++-- src/IO/WriteBufferFromS3TaskTracker.h | 8 +- 11 files changed, 124 insertions(+), 67 deletions(-) diff --git a/src/Backups/BackupIO_AzureBlobStorage.cpp b/src/Backups/BackupIO_AzureBlobStorage.cpp index 52ce20d5108..44a72f80456 100644 --- a/src/Backups/BackupIO_AzureBlobStorage.cpp +++ b/src/Backups/BackupIO_AzureBlobStorage.cpp @@ -278,7 +278,8 @@ std::unique_ptr BackupWriterAzureBlobStorage::writeFile(const Strin settings->max_single_part_upload_size, settings->max_unexpected_write_error_retries, DBMS_DEFAULT_BUFFER_SIZE, - write_settings); + write_settings, + settings->max_inflight_parts_for_one_file); } void BackupWriterAzureBlobStorage::removeFile(const String & file_name) 
diff --git a/src/Core/Settings.h b/src/Core/Settings.h index 44badfefabb..53de245bdfc 100644 --- a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -80,7 +80,8 @@ class IColumn; M(UInt64, s3_max_upload_part_size, 5ull*1024*1024*1024, "The maximum size of part to upload during multipart upload to S3.", 0) \ M(UInt64, s3_upload_part_size_multiply_factor, 2, "Multiply s3_min_upload_part_size by this factor each time s3_multiply_parts_count_threshold parts were uploaded from a single write to S3.", 0) \ M(UInt64, s3_upload_part_size_multiply_parts_count_threshold, 500, "Each time this number of parts was uploaded to S3, s3_min_upload_part_size is multiplied by s3_upload_part_size_multiply_factor.", 0) \ - M(UInt64, s3_max_inflight_parts_for_one_file, 20, "The maximum number of a concurrent loaded parts in multipart upload request. 0 means unlimited. You ", 0) \ + M(UInt64, s3_max_inflight_parts_for_one_file, 20, "The maximum number of a concurrent loaded parts in multipart upload request. 0 means unlimited.", 0) \ + M(UInt64, azure_max_inflight_parts_for_one_file, 20, "The maximum number of a concurrent loaded parts in multipart upload request. 0 means unlimited.", 0) \ M(UInt64, s3_max_single_part_upload_size, 32*1024*1024, "The maximum size of object to upload using singlepart upload to S3.", 0) \ M(UInt64, azure_max_single_part_upload_size, 100*1024*1024, "The maximum size of object to upload using singlepart upload to Azure blob storage.", 0) \ M(UInt64, azure_max_single_part_copy_size, 256*1024*1024, "The maximum size of object to copy using single part copy to Azure blob storage.", 0) \ diff --git a/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp b/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp index 905114f50e9..cbe2367823d 100644 --- a/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp +++ b/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp @@ -18,13 +18,21 @@ namespace ProfileEvents namespace DB { +struct WriteBufferFromAzureBlobStorage::PartData +{ + Memory<> memory; + size_t data_size = 0; +}; + WriteBufferFromAzureBlobStorage::WriteBufferFromAzureBlobStorage( std::shared_ptr blob_container_client_, const String & blob_path_, size_t max_single_part_upload_size_, size_t max_unexpected_write_error_retries_, size_t buf_size_, - const WriteSettings & write_settings_) + const WriteSettings & write_settings_, + size_t max_inflight_parts_for_one_file_, + ThreadPoolCallbackRunner schedule_) : WriteBufferFromFileBase(buf_size_, nullptr, 0) , log(getLogger("WriteBufferFromAzureBlobStorage")) , max_single_part_upload_size(max_single_part_upload_size_) @@ -32,7 +40,13 @@ WriteBufferFromAzureBlobStorage::WriteBufferFromAzureBlobStorage( , blob_path(blob_path_) , write_settings(write_settings_) , blob_container_client(blob_container_client_) + , task_tracker( + std::make_unique( + std::move(schedule_), + max_inflight_parts_for_one_file_, + limitedLog)) { + allocateBuffer(); } @@ -79,60 +93,80 @@ void WriteBufferFromAzureBlobStorage::finalizeImpl() { execWithRetry([this](){ next(); }, max_unexpected_write_error_retries); - if (tmp_buffer_write_offset > 0) - uploadBlock(tmp_buffer->data(), tmp_buffer_write_offset); + task_tracker->waitAll(); auto block_blob_client = blob_container_client->GetBlockBlobClient(blob_path); execWithRetry([&](){ block_blob_client.CommitBlockList(block_ids); }, max_unexpected_write_error_retries); - LOG_TRACE(log, "Committed {} blocks for blob `{}`", block_ids.size(), blob_path); -} - -void WriteBufferFromAzureBlobStorage::uploadBlock(const char * data, size_t size) -{ - 
auto block_blob_client = blob_container_client->GetBlockBlobClient(blob_path); - const std::string & block_id = block_ids.emplace_back(getRandomASCIIString(64)); - - Azure::Core::IO::MemoryBodyStream memory_stream(reinterpret_cast(data), size); - execWithRetry([&](){ block_blob_client.StageBlock(block_id, memory_stream); }, max_unexpected_write_error_retries, size); - tmp_buffer_write_offset = 0; - - LOG_TRACE(log, "Staged block (id: {}) of size {} (blob path: {}).", block_id, size, blob_path); -} - -WriteBufferFromAzureBlobStorage::MemoryBufferPtr WriteBufferFromAzureBlobStorage::allocateBuffer() const -{ - return std::make_unique>(max_single_part_upload_size); + LOG_DEBUG(log, "Committed {} blocks for blob `{}`", block_ids.size(), blob_path); } void WriteBufferFromAzureBlobStorage::nextImpl() { - size_t size_to_upload = offset(); + task_tracker->waitIfAny(); - if (size_to_upload == 0) - return; + reallocateBuffer(); + detachBuffer(); - if (!tmp_buffer) - tmp_buffer = allocateBuffer(); - - size_t uploaded_size = 0; - while (uploaded_size != size_to_upload) + while (!detached_part_data.empty()) { - size_t memory_buffer_remaining_size = max_single_part_upload_size - tmp_buffer_write_offset; - if (memory_buffer_remaining_size == 0) - uploadBlock(tmp_buffer->data(), tmp_buffer->size()); - - size_t size = std::min(memory_buffer_remaining_size, size_to_upload - uploaded_size); - memcpy(tmp_buffer->data() + tmp_buffer_write_offset, working_buffer.begin() + uploaded_size, size); - uploaded_size += size; - tmp_buffer_write_offset += size; + writePart(std::move(detached_part_data.front())); + detached_part_data.pop_front(); } - if (tmp_buffer_write_offset == max_single_part_upload_size) - uploadBlock(tmp_buffer->data(), tmp_buffer->size()); + allocateBuffer(); +} - if (write_settings.remote_throttler) - write_settings.remote_throttler->add(size_to_upload, ProfileEvents::RemoteWriteThrottlerBytes, ProfileEvents::RemoteWriteThrottlerSleepMicroseconds); +void WriteBufferFromAzureBlobStorage::allocateBuffer() +{ + memory = Memory(max_single_part_upload_size); + WriteBuffer::set(memory.data(), memory.size()); +} + + +void WriteBufferFromAzureBlobStorage::reallocateBuffer() +{ + chassert(offset() == 0); + + if (available() > 0) + return; + + if (memory.size() == max_single_part_upload_size) + return; + + memory.resize(max_single_part_upload_size); + + WriteBuffer::set(memory.data(), memory.size()); + + chassert(offset() == 0); +} + +void WriteBufferFromAzureBlobStorage::detachBuffer() +{ + size_t data_size = size_t(position() - memory.data()); + auto buf = std::move(memory); + WriteBuffer::set(nullptr, 0); + detached_part_data.push_back({std::move(buf), data_size}); +} + +void WriteBufferFromAzureBlobStorage::writePart(WriteBufferFromAzureBlobStorage::PartData && data) +{ + if (data.data_size == 0) + return; + + auto upload_worker = [&] () + { + auto block_blob_client = blob_container_client->GetBlockBlobClient(blob_path); + const std::string & block_id = block_ids.emplace_back(getRandomASCIIString(64)); + + Azure::Core::IO::MemoryBodyStream memory_stream(reinterpret_cast(data.memory.data()), data.data_size); + execWithRetry([&](){ block_blob_client.StageBlock(block_id, memory_stream); }, max_unexpected_write_error_retries, data.data_size); + + if (write_settings.remote_throttler) + write_settings.remote_throttler->add(data.data_size, ProfileEvents::RemoteWriteThrottlerBytes, ProfileEvents::RemoteWriteThrottlerSleepMicroseconds); + }; + + task_tracker->add(std::move(upload_worker)); } } diff --git 
a/src/Disks/IO/WriteBufferFromAzureBlobStorage.h b/src/Disks/IO/WriteBufferFromAzureBlobStorage.h index f105b35c121..2d11014fa2a 100644 --- a/src/Disks/IO/WriteBufferFromAzureBlobStorage.h +++ b/src/Disks/IO/WriteBufferFromAzureBlobStorage.h @@ -11,6 +11,7 @@ #include #include #include +#include namespace Poco @@ -21,6 +22,8 @@ class Logger; namespace DB { +class TaskTracker; + class WriteBufferFromAzureBlobStorage : public WriteBufferFromFileBase { public: @@ -32,7 +35,9 @@ public: size_t max_single_part_upload_size_, size_t max_unexpected_write_error_retries_, size_t buf_size_, - const WriteSettings & write_settings_); + const WriteSettings & write_settings_, + size_t max_inflight_parts_for_one_file_, + ThreadPoolCallbackRunner schedule_ = {}); ~WriteBufferFromAzureBlobStorage() override; @@ -42,11 +47,21 @@ public: void sync() override { next(); } private: + struct PartData; + + void writePart(WriteBufferFromAzureBlobStorage::PartData && data); + void detachBuffer(); + void allocateBuffer(); + void allocateFirstBuffer(); + void reallocateFirstBuffer(); + void reallocateBuffer(); + void finalizeImpl() override; void execWithRetry(std::function func, size_t num_tries, size_t cost = 0); void uploadBlock(const char * data, size_t size); LoggerPtr log; + LogSeriesLimiterPtr limitedLog = std::make_shared(log, 1, 5); const size_t max_single_part_upload_size; const size_t max_unexpected_write_error_retries; @@ -61,6 +76,11 @@ private: size_t tmp_buffer_write_offset = 0; MemoryBufferPtr allocateBuffer() const; + + bool first_buffer=true; + + std::unique_ptr task_tracker; + std::deque detached_part_data; }; } diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp index 72c4abee5c9..f99586b2d1a 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp @@ -169,7 +169,8 @@ std::unique_ptr getAzureBlobStorageSettings(const Po config.getUInt64(config_prefix + ".max_upload_part_size", 5ULL * 1024 * 1024 * 1024), config.getUInt64(config_prefix + ".max_single_part_copy_size", context->getSettings().azure_max_single_part_copy_size), config.getBool(config_prefix + ".use_native_copy", false), - config.getUInt64(config_prefix + ".max_unexpected_write_error_retries", context->getSettings().azure_max_unexpected_write_error_retries) + config.getUInt64(config_prefix + ".max_unexpected_write_error_retries", context->getSettings().azure_max_unexpected_write_error_retries), + config.getUInt64(config_prefix + ".max_inflight_parts_for_one_file", context->getSettings().azure_max_inflight_parts_for_one_file) ); } diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp index 74389aedb64..844789ea5b5 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp @@ -268,7 +268,8 @@ std::unique_ptr AzureObjectStorage::writeObject( /// NO settings.get()->max_single_part_upload_size, settings.get()->max_unexpected_write_error_retries, buf_size, - patchSettings(write_settings)); + patchSettings(write_settings), + settings.get()->max_inflight_parts_for_one_file); } /// Remove file. Throws exception if file doesn't exists or it's a directory. 
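For illustration only — a sketch of how the new per-disk knob wired in above could appear in a disk definition for an `azure_blob_storage` disk. The key name and its fallback to the `azure_max_inflight_parts_for_one_file` server setting (default 20, 0 meaning unlimited) come from this patch; the disk name and connection fields are placeholders:

``` xml
<blob_storage_disk>
    <type>azure_blob_storage</type>
    <storage_account_url>http://account.blob.core.windows.net</storage_account_url>
    <container_name>container</container_name>
    <!-- per-disk override; if omitted, the azure_max_inflight_parts_for_one_file server setting (default 20) is used, 0 means unlimited -->
    <max_inflight_parts_for_one_file>20</max_inflight_parts_for_one_file>
</blob_storage_disk>
```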
diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h index f16c35fb52c..1b473a01304 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h @@ -27,7 +27,8 @@ struct AzureObjectStorageSettings size_t max_upload_part_size_, size_t max_single_part_copy_size_, bool use_native_copy_, - size_t max_unexpected_write_error_retries_) + size_t max_unexpected_write_error_retries_, + size_t max_inflight_parts_for_one_file_) : max_single_part_upload_size(max_single_part_upload_size_) , min_bytes_for_seek(min_bytes_for_seek_) , max_single_read_retries(max_single_read_retries_) @@ -37,6 +38,7 @@ struct AzureObjectStorageSettings , max_single_part_copy_size(max_single_part_copy_size_) , use_native_copy(use_native_copy_) , max_unexpected_write_error_retries (max_unexpected_write_error_retries_) + , max_inflight_parts_for_one_file (max_inflight_parts_for_one_file_) { } @@ -52,6 +54,7 @@ struct AzureObjectStorageSettings size_t max_single_part_copy_size = 256 * 1024 * 1024; bool use_native_copy = false; size_t max_unexpected_write_error_retries = 4; + size_t max_inflight_parts_for_one_file = 20; }; using AzureClient = Azure::Storage::Blobs::BlobContainerClient; diff --git a/src/IO/WriteBufferFromS3.cpp b/src/IO/WriteBufferFromS3.cpp index 5bb01050591..6fc0a35672f 100644 --- a/src/IO/WriteBufferFromS3.cpp +++ b/src/IO/WriteBufferFromS3.cpp @@ -95,7 +95,7 @@ WriteBufferFromS3::WriteBufferFromS3( , object_metadata(std::move(object_metadata_)) , buffer_allocation_policy(ChooseBufferPolicy(upload_settings)) , task_tracker( - std::make_unique( + std::make_unique( std::move(schedule_), upload_settings.max_inflight_parts_for_one_file, limitedLog)) diff --git a/src/IO/WriteBufferFromS3.h b/src/IO/WriteBufferFromS3.h index 230f39b074e..f3637122ee4 100644 --- a/src/IO/WriteBufferFromS3.h +++ b/src/IO/WriteBufferFromS3.h @@ -12,6 +12,7 @@ #include #include #include +#include #include #include @@ -26,6 +27,8 @@ namespace DB * Data is divided on chunks with size greater than 'minimum_upload_part_size'. Last chunk can be less than this threshold. * Each chunk is written as a part to S3. */ +class TaskTracker; + class WriteBufferFromS3 final : public WriteBufferFromFileBase { public: @@ -118,7 +121,7 @@ private: size_t total_size = 0; size_t hidden_size = 0; - class TaskTracker; +// class TaskTracker; std::unique_ptr task_tracker; BlobStorageLogWriterPtr blob_log; diff --git a/src/IO/WriteBufferFromS3TaskTracker.cpp b/src/IO/WriteBufferFromS3TaskTracker.cpp index bce122dd6c8..e62de261fc2 100644 --- a/src/IO/WriteBufferFromS3TaskTracker.cpp +++ b/src/IO/WriteBufferFromS3TaskTracker.cpp @@ -1,7 +1,5 @@ #include "config.h" -#if USE_AWS_S3 - #include namespace ProfileEvents @@ -12,19 +10,19 @@ namespace ProfileEvents namespace DB { -WriteBufferFromS3::TaskTracker::TaskTracker(ThreadPoolCallbackRunner scheduler_, size_t max_tasks_inflight_, LogSeriesLimiterPtr limitedLog_) +TaskTracker::TaskTracker(ThreadPoolCallbackRunner scheduler_, size_t max_tasks_inflight_, LogSeriesLimiterPtr limitedLog_) : is_async(bool(scheduler_)) , scheduler(scheduler_ ? 
std::move(scheduler_) : syncRunner()) , max_tasks_inflight(max_tasks_inflight_) , limitedLog(limitedLog_) {} -WriteBufferFromS3::TaskTracker::~TaskTracker() +TaskTracker::~TaskTracker() { safeWaitAll(); } -ThreadPoolCallbackRunner WriteBufferFromS3::TaskTracker::syncRunner() +ThreadPoolCallbackRunner TaskTracker::syncRunner() { return [](Callback && callback, int64_t) mutable -> std::future { @@ -35,7 +33,7 @@ ThreadPoolCallbackRunner WriteBufferFromS3::TaskTracker::syncRunner() }; } -void WriteBufferFromS3::TaskTracker::waitAll() +void TaskTracker::waitAll() { /// Exceptions are propagated for (auto & future : futures) @@ -48,7 +46,7 @@ void WriteBufferFromS3::TaskTracker::waitAll() finished_futures.clear(); } -void WriteBufferFromS3::TaskTracker::safeWaitAll() +void TaskTracker::safeWaitAll() { for (auto & future : futures) { @@ -71,7 +69,7 @@ void WriteBufferFromS3::TaskTracker::safeWaitAll() finished_futures.clear(); } -void WriteBufferFromS3::TaskTracker::waitIfAny() +void TaskTracker::waitIfAny() { if (futures.empty()) return; @@ -99,7 +97,7 @@ void WriteBufferFromS3::TaskTracker::waitIfAny() ProfileEvents::increment(ProfileEvents::WriteBufferFromS3WaitInflightLimitMicroseconds, watch.elapsedMicroseconds()); } -void WriteBufferFromS3::TaskTracker::add(Callback && func) +void TaskTracker::add(Callback && func) { /// All this fuzz is about 2 things. This is the most critical place of TaskTracker. /// The first is not to fail insertion in the list `futures`. @@ -134,7 +132,7 @@ void WriteBufferFromS3::TaskTracker::add(Callback && func) waitTilInflightShrink(); } -void WriteBufferFromS3::TaskTracker::waitTilInflightShrink() +void TaskTracker::waitTilInflightShrink() { if (!max_tasks_inflight) return; @@ -166,11 +164,10 @@ void WriteBufferFromS3::TaskTracker::waitTilInflightShrink() ProfileEvents::increment(ProfileEvents::WriteBufferFromS3WaitInflightLimitMicroseconds, watch.elapsedMicroseconds()); } -bool WriteBufferFromS3::TaskTracker::isAsync() const +bool TaskTracker::isAsync() const { return is_async; } } -#endif diff --git a/src/IO/WriteBufferFromS3TaskTracker.h b/src/IO/WriteBufferFromS3TaskTracker.h index 815e041ae52..134abbbc4c1 100644 --- a/src/IO/WriteBufferFromS3TaskTracker.h +++ b/src/IO/WriteBufferFromS3TaskTracker.h @@ -1,9 +1,7 @@ #pragma once #include "config.h" - -#if USE_AWS_S3 - +#include #include "WriteBufferFromS3.h" #include @@ -22,7 +20,7 @@ namespace DB /// Basic exception safety is provided. If exception occurred the object has to be destroyed. /// No thread safety is provided. Use this object with no concurrency. 
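A minimal usage sketch of the relocated class, for illustration only — it assumes the members declared in this header, and `uploadPart` is a placeholder rather than a real ClickHouse symbol:

```cpp
#include <string>
#include <vector>
#include <IO/WriteBufferFromS3TaskTracker.h>

void uploadPart(const std::string & part); // placeholder for whatever work each task performs

// Drives TaskTracker the way the write buffers above do: schedule work with add(),
// let it throttle once max_tasks_inflight tasks are running, then drain with waitAll().
void uploadAll(const std::vector<std::string> & parts, LogSeriesLimiterPtr limited_log)
{
    // An empty scheduler makes the tracker synchronous: it falls back to syncRunner().
    DB::TaskTracker tracker(/*scheduler=*/{}, /*max_tasks_inflight=*/4, limited_log);

    for (const auto & part : parts)
        tracker.add([&] { uploadPart(part); }); // may block until the number of inflight tasks shrinks below the limit

    tracker.waitAll(); // waits for every task and rethrows any captured exception
}
```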
-class WriteBufferFromS3::TaskTracker +class TaskTracker { public: using Callback = std::function; @@ -68,5 +66,3 @@ private: }; } - -#endif From 26fd3d0d852986b6bbaf595087cb0d06bdff9f93 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Wed, 14 Feb 2024 16:13:53 +0100 Subject: [PATCH 024/985] Removed offset check --- src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp | 2 -- 1 file changed, 2 deletions(-) diff --git a/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp b/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp index cbe2367823d..d700090303a 100644 --- a/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp +++ b/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp @@ -126,8 +126,6 @@ void WriteBufferFromAzureBlobStorage::allocateBuffer() void WriteBufferFromAzureBlobStorage::reallocateBuffer() { - chassert(offset() == 0); - if (available() > 0) return; From 750a82a4ff615190a2793c0cfae9f4c1f5c75433 Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 15 Feb 2024 13:23:33 +0100 Subject: [PATCH 025/985] Update doc --- .../mergetree-family/mergetree.md | 2 + docs/en/operations/storing-data.md | 146 ++++++++++++++++-- 2 files changed, 134 insertions(+), 14 deletions(-) diff --git a/docs/en/engines/table-engines/mergetree-family/mergetree.md b/docs/en/engines/table-engines/mergetree-family/mergetree.md index f185c11bab3..e1eef8db9ab 100644 --- a/docs/en/engines/table-engines/mergetree-family/mergetree.md +++ b/docs/en/engines/table-engines/mergetree-family/mergetree.md @@ -1106,6 +1106,8 @@ Configuration markup: ``` +Also see [configuring external storage options](/docs/en/operations/storing-data.md/#configuring-external-storage). + :::note cache configuration ClickHouse versions 22.3 through 22.7 use a different cache configuration, see [using local cache](/docs/en/operations/storing-data.md/#using-local-cache) if you are using one of those versions. ::: diff --git a/docs/en/operations/storing-data.md b/docs/en/operations/storing-data.md index 003277c8d4f..7a7edfb1a90 100644 --- a/docs/en/operations/storing-data.md +++ b/docs/en/operations/storing-data.md @@ -11,45 +11,163 @@ To work with data stored on `Amazon S3` disks use [S3](/docs/en/engines/table-en To load data from a web server with static files use a disk with type [web](#storing-data-on-webserver). -## Configuring HDFS {#configuring-hdfs} +## Configuring external storage {#configuring-external-storage} -[MergeTree](/docs/en/engines/table-engines/mergetree-family/mergetree.md) and [Log](/docs/en/engines/table-engines/log-family/log.md) family table engines can store data to HDFS using a disk with type `HDFS`. +[MergeTree](/docs/en/engines/table-engines/mergetree-family/mergetree.md) and [Log](/docs/en/engines/table-engines/log-family/log.md) family table engines can store data to `S3`, `AzureBlobStorage`, `HDFS` using a disk with types `s3`, `azure_blob_storage`, `hdfs` accordingly. Configuration markup: +Let's take a look at the different storage configuration options, using `S3` storage as an example. +First, define the configuration in the server configuration file. In order to configure `S3` storage, the following configuration can be used: + ``` xml - - hdfs - hdfs://hdfs1:9000/clickhouse/ - + + s3 + https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/ + 1 + -
- hdfs + s3
-
+
+
+``` +Starting with 24.1 clickhouse version, a different type of configuration is supported in addition to the older one: + +``` xml + + + + + object_storage + s3 + local + https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/ + 1 + + + + + +
+ s3 +
+
+
+
+
+
+``` + +In order to make a specific kind of storage a default option for all `MergeTree` tables add the following section to configuration file: + +``` xml + - 0 + s3 ``` -Required parameters: +If you want to configure a specific storage policy only to specific table, you can define it in settings while creating the table: -- `endpoint` — HDFS endpoint URL in `path` format. Endpoint URL should contain a root path to store data. +``` sql +CREATE TABLE test (a Int32, b String) +ENGINE = MergeTree() ORDER BY a +SETTINGS storage_policy = 's3'; +``` -Optional parameters: +You can also use `disk` instead of `storage_policy`. In this case it is not requires to have `storage_policy` section in configuration file, only `disk` section would be enough. -- `min_bytes_for_seek` — The minimal number of bytes to use seek operation instead of sequential read. Default value: `1 Mb`. +``` sql +CREATE TABLE test (a Int32, b String) +ENGINE = MergeTree() ORDER BY a +SETTINGS disk = 's3'; +``` + +There is also a possibility to specify storage configuration without a preconfigured disk in configuration file: + +``` sql +CREATE TABLE test (a Int32, b String) +ENGINE = MergeTree() ORDER BY a +SETTINGS disk = disk(name = 's3_disk', type = 's3', endpoint = 'https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/', use_environment_credentials = 1); +``` + +Adding cache is also possible: + +``` sql +CREATE TABLE test (a Int32, b String) +ENGINE = MergeTree() ORDER BY a +SETTINGS disk = disk(name = 'cached_s3_disk', type = 'cache', max_size = '10Gi', path = '/s3_cache', disk = disk(name = 's3_disk', type = 's3', endpoint = 'https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/', use_environment_credentials = 1)); +``` + +A combination of config file disk configuration and sql-defined configuration is also possible: + +``` sql +CREATE TABLE test (a Int32, b String) +ENGINE = MergeTree() ORDER BY a +SETTINGS disk = disk(name = 'cached_s3_disk', type = 'cache', max_size = '10Gi', path = '/s3_cache', disk = 's3'); +``` + +Here `s3` is a disk name from server configuration file, while `cache` disk is defined via sql. + +Let's take a closer look at configuration parameters. + +All disk configuration require `type` section, equal to one of `s3`, `azure_blob_storage`, `hdfs`, `local`, `cache`, `web`. Then goes configuration of a specific storage type. +Starting from 24.1 clickhouse version, you can you a new configuration option. For it you are required to specify `type` as `object_storage`, `object_storage_type` as one of `s3`, `azure_blob_storage`, `hdfs`, `local`, `cache`, `web`, and optionally you can specify `metadata_type`, which is `local` by default, but it can also be set to `plain`, `web`. + +E.g. first configuration option: +``` xml + + s3 + https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/ + 1 + +``` + +and second (from `24.1`): +``` xml + + object_storage + s3 + local + https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/ + 1 + +``` + +Configuration like +``` xml + + s3_plain + https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/ + 1 + +``` + +is equal to +``` xml + + object_storage + s3 + plain + https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/ + 1 + +``` + +For details configuration options of each storage see [MergeTree](/docs/en/engines/table-engines/mergetree-family/mergetree.md). 
## Using Virtual File System for Data Encryption {#encrypted-virtual-file-system} From 9bcd4daabe56e29132fc5098420afb4dcba9001d Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 15 Feb 2024 16:19:31 +0100 Subject: [PATCH 026/985] Better --- .../mergetree-family/mergetree.md | 294 +------------ docs/en/operations/storing-data.md | 411 +++++++++++++++--- 2 files changed, 346 insertions(+), 359 deletions(-) diff --git a/docs/en/engines/table-engines/mergetree-family/mergetree.md b/docs/en/engines/table-engines/mergetree-family/mergetree.md index e1eef8db9ab..0fff13c906f 100644 --- a/docs/en/engines/table-engines/mergetree-family/mergetree.md +++ b/docs/en/engines/table-engines/mergetree-family/mergetree.md @@ -987,49 +987,6 @@ ORDER BY (postcode1, postcode2, addr1, addr2) # highlight-end ``` -### Nested Dynamic Storage - -This example query builds on the above dynamic disk configuration and shows how to -use a local disk to cache data from a table stored at a URL. Neither the cache disk -nor the web storage is configured in the ClickHouse configuration files; both are -configured in the CREATE/ATTACH query settings. - -In the settings highlighted below notice that the disk of `type=web` is nested within -the disk of `type=cache`. - -```sql -ATTACH TABLE uk_price_paid UUID 'cf712b4f-2ca8-435c-ac23-c4393efe52f7' -( - price UInt32, - date Date, - postcode1 LowCardinality(String), - postcode2 LowCardinality(String), - type Enum8('other' = 0, 'terraced' = 1, 'semi-detached' = 2, 'detached' = 3, 'flat' = 4), - is_new UInt8, - duration Enum8('unknown' = 0, 'freehold' = 1, 'leasehold' = 2), - addr1 String, - addr2 String, - street LowCardinality(String), - locality LowCardinality(String), - town LowCardinality(String), - district LowCardinality(String), - county LowCardinality(String) -) -ENGINE = MergeTree -ORDER BY (postcode1, postcode2, addr1, addr2) - # highlight-start - SETTINGS disk = disk( - type=cache, - max_size='1Gi', - path='/var/lib/clickhouse/custom_disk_cache/', - disk=disk( - type=web, - endpoint='https://raw.githubusercontent.com/ClickHouse/web-tables-demo/main/web/' - ) - ); - # highlight-end -``` - ### Details {#details} In the case of `MergeTree` tables, data is getting to disk in different ways: @@ -1058,19 +1015,17 @@ During this time, they are not moved to other volumes or disks. Therefore, until User can assign new big parts to different disks of a [JBOD](https://en.wikipedia.org/wiki/Non-RAID_drive_architectures) volume in a balanced way using the [min_bytes_to_rebalance_partition_over_jbod](/docs/en/operations/settings/merge-tree-settings.md/#min-bytes-to-rebalance-partition-over-jbod) setting. -## Using S3 for Data Storage {#table_engine-mergetree-s3} +## Using External Storage for Data Storage {#table_engine-mergetree-s3} -:::note -Google Cloud Storage (GCS) is also supported using the type `s3`. See [GCS backed MergeTree](/docs/en/integrations/gcs). -::: +[MergeTree](/docs/en/engines/table-engines/mergetree-family/mergetree.md) family table engines can store data to `S3`, `AzureBlobStorage`, `HDFS` using a disk with types `s3`, `azure_blob_storage`, `hdfs` accordingly. See [configuring external storage options](/docs/en/operations/storing-data.md/#configuring-external-storage) for more details. -`MergeTree` family table engines can store data to [S3](https://aws.amazon.com/s3/) using a disk with type `s3`. +Example for [S3](https://aws.amazon.com/s3/) as external storage using a disk with type `s3`. Configuration markup: ``` xml ... 
- +e s3 true @@ -1112,247 +1067,6 @@ Also see [configuring external storage options](/docs/en/operations/storing-data ClickHouse versions 22.3 through 22.7 use a different cache configuration, see [using local cache](/docs/en/operations/storing-data.md/#using-local-cache) if you are using one of those versions. ::: -### Configuring the S3 disk - -Required parameters: - -- `endpoint` — S3 endpoint URL in `path` or `virtual hosted` [styles](https://docs.aws.amazon.com/AmazonS3/latest/dev/VirtualHosting.html). Endpoint URL should contain a bucket and root path to store data. -- `access_key_id` — S3 access key id. -- `secret_access_key` — S3 secret access key. - -Optional parameters: - -- `region` — S3 region name. -- `support_batch_delete` — This controls the check to see if batch deletes are supported. Set this to `false` when using Google Cloud Storage (GCS) as GCS does not support batch deletes and preventing the checks will prevent error messages in the logs. -- `use_environment_credentials` — Reads AWS credentials from the Environment variables AWS_ACCESS_KEY_ID and AWS_SECRET_ACCESS_KEY and AWS_SESSION_TOKEN if they exist. Default value is `false`. -- `use_insecure_imds_request` — If set to `true`, S3 client will use insecure IMDS request while obtaining credentials from Amazon EC2 metadata. Default value is `false`. -- `expiration_window_seconds` — Grace period for checking if expiration-based credentials have expired. Optional, default value is `120`. -- `proxy` — Proxy configuration for S3 endpoint. Each `uri` element inside `proxy` block should contain a proxy URL. -- `connect_timeout_ms` — Socket connect timeout in milliseconds. Default value is `10 seconds`. -- `request_timeout_ms` — Request timeout in milliseconds. Default value is `5 seconds`. -- `retry_attempts` — Number of retry attempts in case of failed request. Default value is `10`. -- `single_read_retries` — Number of retry attempts in case of connection drop during read. Default value is `4`. -- `min_bytes_for_seek` — Minimal number of bytes to use seek operation instead of sequential read. Default value is `1 Mb`. -- `metadata_path` — Path on local FS to store metadata files for S3. Default value is `/var/lib/clickhouse/disks//`. -- `skip_access_check` — If true, disk access checks will not be performed on disk start-up. Default value is `false`. -- `header` — Adds specified HTTP header to a request to given endpoint. Optional, can be specified multiple times. -- `server_side_encryption_customer_key_base64` — If specified, required headers for accessing S3 objects with SSE-C encryption will be set. -- `server_side_encryption_kms_key_id` - If specified, required headers for accessing S3 objects with [SSE-KMS encryption](https://docs.aws.amazon.com/AmazonS3/latest/userguide/UsingKMSEncryption.html) will be set. If an empty string is specified, the AWS managed S3 key will be used. Optional. -- `server_side_encryption_kms_encryption_context` - If specified alongside `server_side_encryption_kms_key_id`, the given encryption context header for SSE-KMS will be set. Optional. -- `server_side_encryption_kms_bucket_key_enabled` - If specified alongside `server_side_encryption_kms_key_id`, the header to enable S3 bucket keys for SSE-KMS will be set. Optional, can be `true` or `false`, defaults to nothing (matches the bucket-level setting). -- `s3_max_put_rps` — Maximum PUT requests per second rate before throttling. Default value is `0` (unlimited). 
-- `s3_max_put_burst` — Max number of requests that can be issued simultaneously before hitting request per second limit. By default (`0` value) equals to `s3_max_put_rps`. -- `s3_max_get_rps` — Maximum GET requests per second rate before throttling. Default value is `0` (unlimited). -- `s3_max_get_burst` — Max number of requests that can be issued simultaneously before hitting request per second limit. By default (`0` value) equals to `s3_max_get_rps`. -- `read_resource` — Resource name to be used for [scheduling](/docs/en/operations/workload-scheduling.md) of read requests to this disk. Default value is empty string (IO scheduling is not enabled for this disk). -- `write_resource` — Resource name to be used for [scheduling](/docs/en/operations/workload-scheduling.md) of write requests to this disk. Default value is empty string (IO scheduling is not enabled for this disk). -- `key_template` — Define the format with which the object keys are generated. By default, Clickhouse takes `root path` from `endpoint` option and adds random generated suffix. That suffix is a dir with 3 random symbols and a file name with 29 random symbols. With that option you have a full control how to the object keys are generated. Some usage scenarios require having random symbols in the prefix or in the middle of object key. For example: `[a-z]{3}-prefix-random/constant-part/random-middle-[a-z]{3}/random-suffix-[a-z]{29}`. The value is parsed with [`re2`](https://github.com/google/re2/wiki/Syntax). Only some subset of the syntax is supported. Check if your preferred format is supported before using that option. Disk isn't initialized if clickhouse is unable to generate a key by the value of `key_template`. It requires enabled feature flag [storage_metadata_write_full_object_key](/docs/en/operations/settings/settings#storage_metadata_write_full_object_key). It forbids declaring the `root path` in `endpoint` option. It requires definition of the option `key_compatibility_prefix`. -- `key_compatibility_prefix` — That option is required when option `key_template` is in use. In order to be able to read the objects keys which were stored in the metadata files with the metadata version lower that `VERSION_FULL_OBJECT_KEY`, the previous `root path` from the `endpoint` option should be set here. - -### Configuring the cache - -This is the cache configuration from above: -```xml - - cache - s3 - /var/lib/clickhouse/disks/s3_cache/ - 10Gi - -``` - -These parameters define the cache layer: -- `type` — If a disk is of type `cache` it caches mark and index files in memory. -- `disk` — The name of the disk that will be cached. - -Cache parameters: -- `path` — The path where metadata for the cache is stored. -- `max_size` — The size (amount of disk space) that the cache can grow to. - -:::tip -There are several other cache parameters that you can use to tune your storage, see [using local cache](/docs/en/operations/storing-data.md/#using-local-cache) for the details. -::: - -S3 disk can be configured as `main` or `cold` storage: -``` xml - - ... - - - s3 - https://clickhouse-public-datasets.s3.amazonaws.com/my-bucket/root-path/ - your_access_key_id - your_secret_access_key - - - - - -
- s3 -
-
-
- - -
- default -
- - s3 - -
- 0.2 -
-
- ... -
-``` - -In case of `cold` option a data can be moved to S3 if local disk free size will be smaller than `move_factor * disk_size` or by TTL move rule. - -## Using Azure Blob Storage for Data Storage {#table_engine-mergetree-azure-blob-storage} - -`MergeTree` family table engines can store data to [Azure Blob Storage](https://azure.microsoft.com/en-us/services/storage/blobs/) using a disk with type `azure_blob_storage`. - -As of February 2022, this feature is still a fresh addition, so expect that some Azure Blob Storage functionalities might be unimplemented. - -Configuration markup: -``` xml - - ... - - - azure_blob_storage - http://account.blob.core.windows.net - container - account - pass123 - /var/lib/clickhouse/disks/blob_storage_disk/ - /var/lib/clickhouse/disks/blob_storage_disk/cache/ - false - - - ... - -``` - -Connection parameters: -* `storage_account_url` - **Required**, Azure Blob Storage account URL, like `http://account.blob.core.windows.net` or `http://azurite1:10000/devstoreaccount1`. -* `container_name` - Target container name, defaults to `default-container`. -* `container_already_exists` - If set to `false`, a new container `container_name` is created in the storage account, if set to `true`, disk connects to the container directly, and if left unset, disk connects to the account, checks if the container `container_name` exists, and creates it if it doesn't exist yet. - -Authentication parameters (the disk will try all available methods **and** Managed Identity Credential): -* `connection_string` - For authentication using a connection string. -* `account_name` and `account_key` - For authentication using Shared Key. - -Limit parameters (mainly for internal usage): -* `s3_max_single_part_upload_size` - Limits the size of a single block upload to Blob Storage. -* `min_bytes_for_seek` - Limits the size of a seekable region. -* `max_single_read_retries` - Limits the number of attempts to read a chunk of data from Blob Storage. -* `max_single_download_retries` - Limits the number of attempts to download a readable buffer from Blob Storage. -* `thread_pool_size` - Limits the number of threads with which `IDiskRemote` is instantiated. -* `s3_max_inflight_parts_for_one_file` - Limits the number of put requests that can be run concurrently for one object. - -Other parameters: -* `metadata_path` - Path on local FS to store metadata files for Blob Storage. Default value is `/var/lib/clickhouse/disks//`. -* `skip_access_check` - If true, disk access checks will not be performed on disk start-up. Default value is `false`. -* `read_resource` — Resource name to be used for [scheduling](/docs/en/operations/workload-scheduling.md) of read requests to this disk. Default value is empty string (IO scheduling is not enabled for this disk). -* `write_resource` — Resource name to be used for [scheduling](/docs/en/operations/workload-scheduling.md) of write requests to this disk. Default value is empty string (IO scheduling is not enabled for this disk). - -Examples of working configurations can be found in integration tests directory (see e.g. [test_merge_tree_azure_blob_storage](https://github.com/ClickHouse/ClickHouse/blob/master/tests/integration/test_merge_tree_azure_blob_storage/configs/config.d/storage_conf.xml) or [test_azure_blob_storage_zero_copy_replication](https://github.com/ClickHouse/ClickHouse/blob/master/tests/integration/test_azure_blob_storage_zero_copy_replication/configs/config.d/storage_conf.xml)). 
- -:::note Zero-copy replication is not ready for production -Zero-copy replication is disabled by default in ClickHouse version 22.8 and higher. This feature is not recommended for production use. -::: - -## HDFS storage {#hdfs-storage} - -In this sample configuration: -- the disk is of type `hdfs` -- the data is hosted at `hdfs://hdfs1:9000/clickhouse/` - -```xml - - - - - hdfs - hdfs://hdfs1:9000/clickhouse/ - true - - - local - / - - - - - -
- hdfs -
- - hdd - -
-
-
-
-
-``` - -## Web storage (read-only) {#web-storage} - -Web storage can be used for read-only purposes. An example use is for hosting sample -data, or for migrating data. - -:::tip -Storage can also be configured temporarily within a query, if a web dataset is not expected -to be used routinely, see [dynamic storage](#dynamic-storage) and skip editing the -configuration file. -::: - -In this sample configuration: -- the disk is of type `web` -- the data is hosted at `http://nginx:80/test1/` -- a cache on local storage is used - -```xml - - - - - web - http://nginx:80/test1/ - - - cache - web - cached_web_cache/ - 100000000 - - - - - -
- web -
-
-
- - -
- cached_web -
-
-
-
-
-
-``` - ## Virtual Columns {#virtual-columns} - `_part` — Name of a part. diff --git a/docs/en/operations/storing-data.md b/docs/en/operations/storing-data.md index 7a7edfb1a90..baf4e1999a7 100644 --- a/docs/en/operations/storing-data.md +++ b/docs/en/operations/storing-data.md @@ -5,21 +5,68 @@ sidebar_label: "External Disks for Storing Data" title: "External Disks for Storing Data" --- -Data, processed in ClickHouse, is usually stored in the local file system — on the same machine with the ClickHouse server. That requires large-capacity disks, which can be expensive enough. To avoid that you can store the data remotely — on [Amazon S3](https://aws.amazon.com/s3/) disks or in the Hadoop Distributed File System ([HDFS](https://hadoop.apache.org/docs/current/hadoop-project-dist/hadoop-hdfs/HdfsDesign.html)). +Data, processed in ClickHouse, is usually stored in the local file system — on the same machine with the ClickHouse server. That requires large-capacity disks, which can be expensive enough. To avoid that you can store the data remotely. Various storages are supported: +1. [Amazon S3](https://aws.amazon.com/s3/) object storage. +2. The Hadoop Distributed File System ([HDFS](https://hadoop.apache.org/docs/current/hadoop-project-dist/hadoop-hdfs/HdfsDesign.html)) +3. [Azure Blob Storage](https://azure.microsoft.com/en-us/products/storage/blobs). -To work with data stored on `Amazon S3` disks use [S3](/docs/en/engines/table-engines/integrations/s3.md) table engine, and to work with data in the Hadoop Distributed File System — [HDFS](/docs/en/engines/table-engines/integrations/hdfs.md) table engine. - -To load data from a web server with static files use a disk with type [web](#storing-data-on-webserver). +Note: to work with data stored on `Amazon S3` disks use [S3](/docs/en/engines/table-engines/integrations/s3.md) table engine, to work with data in the Hadoop Distributed File System — [HDFS](/docs/en/engines/table-engines/integrations/hdfs.md) table engine, and to work with data stored in Azure Blob Storage use [AzureBlobStorage](/docs/en/engines/table-engines/integrations/AzureBlobStorage.md) table engine. They are different from external storage described on this page as they allow to read data stored in some general file format (like Parquet), while on this page we are describing storage configuration for ClickHouse `MergeTree` famility or `Log` family tables. ## Configuring external storage {#configuring-external-storage} [MergeTree](/docs/en/engines/table-engines/mergetree-family/mergetree.md) and [Log](/docs/en/engines/table-engines/log-family/log.md) family table engines can store data to `S3`, `AzureBlobStorage`, `HDFS` using a disk with types `s3`, `azure_blob_storage`, `hdfs` accordingly. -Configuration markup: +Disk configuration requires: +1. `type` section, equal to one of `s3`, `azure_blob_storage`, `hdfs`, `local_blob_storage`, `web`. +2. Configuration of a specific external storage type. -Let's take a loop at different storage configuration options on the example of `S3` storage. -Firstly, define configuration in server configuration file. In order to configure `S3` storage the following configuration can be used: +Starting from 24.1 clickhouse version, it is possible to use a new configuration option. +It requires to specify: +1. `type` equal to `object_storage` +2. `object_storage_type`, equal to one of `s3`, `azure_blob_storage`, `hdfs`, `local_blob_storage`, `web`. 
+Optionally, `metadata_type` can be specified (it is equal to `local` by default), but it can also be set to `plain`, `web`. +E.g. configuration option +``` xml + + s3 + https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/ + 1 + +``` + +is equal to configuration (from `24.1`): +``` xml + + object_storage + s3 + local + https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/ + 1 + +``` + +Configuration +``` xml + + s3_plain + https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/ + 1 + +``` + +is equal to +``` xml + + object_storage + s3 + plain + https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/ + 1 + +``` + +Example of full storage configuration will look like: ``` xml @@ -43,8 +90,7 @@ Firstly, define configuration in server configuration file. In order to configur ``` -Starting with 24.1 clickhouse version, a different type of configuration is supported in addition to the older one: - +Starting with 24.1 clickhouse version, it can also look like: ``` xml @@ -71,7 +117,6 @@ Starting with 24.1 clickhouse version, a different type of configuration is supp ``` In order to make a specific kind of storage a default option for all `MergeTree` tables add the following section to configuration file: - ``` xml @@ -96,80 +141,259 @@ ENGINE = MergeTree() ORDER BY a SETTINGS disk = 's3'; ``` -There is also a possibility to specify storage configuration without a preconfigured disk in configuration file: +## Dynamic Configuration {#dynamic-configuration} -``` sql -CREATE TABLE test (a Int32, b String) -ENGINE = MergeTree() ORDER BY a -SETTINGS disk = disk(name = 's3_disk', type = 's3', endpoint = 'https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/', use_environment_credentials = 1); +There is also a possibility to specify storage configuration without a predefined disk in configuration in a configuration file, but can be configured in the CREATE/ATTACH query settings. + +The following example query builds on the above dynamic disk configuration and shows how to use a local disk to cache data from a table stored at a URL. + +```sql +ATTACH TABLE uk_price_paid UUID 'cf712b4f-2ca8-435c-ac23-c4393efe52f7' +( + price UInt32, + date Date, + postcode1 LowCardinality(String), + postcode2 LowCardinality(String), + type Enum8('other' = 0, 'terraced' = 1, 'semi-detached' = 2, 'detached' = 3, 'flat' = 4), + is_new UInt8, + duration Enum8('unknown' = 0, 'freehold' = 1, 'leasehold' = 2), + addr1 String, + addr2 String, + street LowCardinality(String), + locality LowCardinality(String), + town LowCardinality(String), + district LowCardinality(String), + county LowCardinality(String) +) +ENGINE = MergeTree +ORDER BY (postcode1, postcode2, addr1, addr2) + # highlight-start + SETTINGS disk = disk( + type=web, + endpoint='https://raw.githubusercontent.com/ClickHouse/web-tables-demo/main/web/' + ); + # highlight-end ``` -Adding cache is also possible: +The example below adds cache to external storage. 
-``` sql -CREATE TABLE test (a Int32, b String) -ENGINE = MergeTree() ORDER BY a -SETTINGS disk = disk(name = 'cached_s3_disk', type = 'cache', max_size = '10Gi', path = '/s3_cache', disk = disk(name = 's3_disk', type = 's3', endpoint = 'https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/', use_environment_credentials = 1)); +```sql +ATTACH TABLE uk_price_paid UUID 'cf712b4f-2ca8-435c-ac23-c4393efe52f7' +( + price UInt32, + date Date, + postcode1 LowCardinality(String), + postcode2 LowCardinality(String), + type Enum8('other' = 0, 'terraced' = 1, 'semi-detached' = 2, 'detached' = 3, 'flat' = 4), + is_new UInt8, + duration Enum8('unknown' = 0, 'freehold' = 1, 'leasehold' = 2), + addr1 String, + addr2 String, + street LowCardinality(String), + locality LowCardinality(String), + town LowCardinality(String), + district LowCardinality(String), + county LowCardinality(String) +) +ENGINE = MergeTree +ORDER BY (postcode1, postcode2, addr1, addr2) + # highlight-start + SETTINGS disk = disk( + type=cache, + max_size='1Gi', + path='/var/lib/clickhouse/custom_disk_cache/', + disk=disk( + type=web, + endpoint='https://raw.githubusercontent.com/ClickHouse/web-tables-demo/main/web/' + ) + ); + # highlight-end ``` -A combination of config file disk configuration and sql-defined configuration is also possible: +In the settings highlighted below notice that the disk of `type=web` is nested within +the disk of `type=cache`. -``` sql -CREATE TABLE test (a Int32, b String) -ENGINE = MergeTree() ORDER BY a -SETTINGS disk = disk(name = 'cached_s3_disk', type = 'cache', max_size = '10Gi', path = '/s3_cache', disk = 's3'); +A combination of config-based configuration and sql-defined configuration is also possible: + +```sql +ATTACH TABLE uk_price_paid UUID 'cf712b4f-2ca8-435c-ac23-c4393efe52f7' +( + price UInt32, + date Date, + postcode1 LowCardinality(String), + postcode2 LowCardinality(String), + type Enum8('other' = 0, 'terraced' = 1, 'semi-detached' = 2, 'detached' = 3, 'flat' = 4), + is_new UInt8, + duration Enum8('unknown' = 0, 'freehold' = 1, 'leasehold' = 2), + addr1 String, + addr2 String, + street LowCardinality(String), + locality LowCardinality(String), + town LowCardinality(String), + district LowCardinality(String), + county LowCardinality(String) +) +ENGINE = MergeTree +ORDER BY (postcode1, postcode2, addr1, addr2) + # highlight-start + SETTINGS disk = disk( + type=cache, + max_size='1Gi', + path='/var/lib/clickhouse/custom_disk_cache/', + disk=disk( + type=web, + endpoint='https://raw.githubusercontent.com/ClickHouse/web-tables-demo/main/web/' + ) + ); + # highlight-end ``` -Here `s3` is a disk name from server configuration file, while `cache` disk is defined via sql. +where `web` is a from a server configuration file: -Let's take a closer look at configuration parameters. - -All disk configuration require `type` section, equal to one of `s3`, `azure_blob_storage`, `hdfs`, `local`, `cache`, `web`. Then goes configuration of a specific storage type. -Starting from 24.1 clickhouse version, you can you a new configuration option. For it you are required to specify `type` as `object_storage`, `object_storage_type` as one of `s3`, `azure_blob_storage`, `hdfs`, `local`, `cache`, `web`, and optionally you can specify `metadata_type`, which is `local` by default, but it can also be set to `plain`, `web`. - -E.g. 
first configuration option: ``` xml - - s3 - https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/ - 1 - + + + + web + 'https://raw.githubusercontent.com/ClickHouse/web-tables-demo/main/web/' + + + ``` -and second (from `24.1`): +### Using S3 Storage {#s3-storage} + +Required parameters: + +- `endpoint` — S3 endpoint URL in `path` or `virtual hosted` [styles](https://docs.aws.amazon.com/AmazonS3/latest/dev/VirtualHosting.html). Endpoint URL should contain a bucket and root path to store data. +- `access_key_id` — S3 access key id. +- `secret_access_key` — S3 secret access key. + +Optional parameters: + +- `region` — S3 region name. +- `support_batch_delete` — This controls the check to see if batch deletes are supported. Set this to `false` when using Google Cloud Storage (GCS) as GCS does not support batch deletes and preventing the checks will prevent error messages in the logs. +- `use_environment_credentials` — Reads AWS credentials from the Environment variables AWS_ACCESS_KEY_ID and AWS_SECRET_ACCESS_KEY and AWS_SESSION_TOKEN if they exist. Default value is `false`. +- `use_insecure_imds_request` — If set to `true`, S3 client will use insecure IMDS request while obtaining credentials from Amazon EC2 metadata. Default value is `false`. +- `expiration_window_seconds` — Grace period for checking if expiration-based credentials have expired. Optional, default value is `120`. +- `proxy` — Proxy configuration for S3 endpoint. Each `uri` element inside `proxy` block should contain a proxy URL. +- `connect_timeout_ms` — Socket connect timeout in milliseconds. Default value is `10 seconds`. +- `request_timeout_ms` — Request timeout in milliseconds. Default value is `5 seconds`. +- `retry_attempts` — Number of retry attempts in case of failed request. Default value is `10`. +- `single_read_retries` — Number of retry attempts in case of connection drop during read. Default value is `4`. +- `min_bytes_for_seek` — Minimal number of bytes to use seek operation instead of sequential read. Default value is `1 Mb`. +- `metadata_path` — Path on local FS to store metadata files for S3. Default value is `/var/lib/clickhouse/disks//`. +- `skip_access_check` — If true, disk access checks will not be performed on disk start-up. Default value is `false`. +- `header` — Adds specified HTTP header to a request to given endpoint. Optional, can be specified multiple times. +- `server_side_encryption_customer_key_base64` — If specified, required headers for accessing S3 objects with SSE-C encryption will be set. +- `server_side_encryption_kms_key_id` - If specified, required headers for accessing S3 objects with [SSE-KMS encryption](https://docs.aws.amazon.com/AmazonS3/latest/userguide/UsingKMSEncryption.html) will be set. If an empty string is specified, the AWS managed S3 key will be used. Optional. +- `server_side_encryption_kms_encryption_context` - If specified alongside `server_side_encryption_kms_key_id`, the given encryption context header for SSE-KMS will be set. Optional. +- `server_side_encryption_kms_bucket_key_enabled` - If specified alongside `server_side_encryption_kms_key_id`, the header to enable S3 bucket keys for SSE-KMS will be set. Optional, can be `true` or `false`, defaults to nothing (matches the bucket-level setting). +- `s3_max_put_rps` — Maximum PUT requests per second rate before throttling. Default value is `0` (unlimited). +- `s3_max_put_burst` — Max number of requests that can be issued simultaneously before hitting request per second limit. 
By default (`0` value) it equals `s3_max_put_rps`.
+- `s3_max_get_rps` — Maximum GET requests per second rate before throttling. Default value is `0` (unlimited).
+- `s3_max_get_burst` — Max number of requests that can be issued simultaneously before hitting request per second limit. By default (`0` value) it equals `s3_max_get_rps`.
+- `read_resource` — Resource name to be used for [scheduling](/docs/en/operations/workload-scheduling.md) of read requests to this disk. Default value is empty string (IO scheduling is not enabled for this disk).
+- `write_resource` — Resource name to be used for [scheduling](/docs/en/operations/workload-scheduling.md) of write requests to this disk. Default value is empty string (IO scheduling is not enabled for this disk).
+- `key_template` — Define the format with which the object keys are generated. By default, ClickHouse takes the `root path` from the `endpoint` option and adds a randomly generated suffix. That suffix is a dir with 3 random symbols and a file name with 29 random symbols. With that option you have full control over how the object keys are generated. Some usage scenarios require having random symbols in the prefix or in the middle of the object key. For example: `[a-z]{3}-prefix-random/constant-part/random-middle-[a-z]{3}/random-suffix-[a-z]{29}`. The value is parsed with [`re2`](https://github.com/google/re2/wiki/Syntax). Only a subset of the syntax is supported. Check if your preferred format is supported before using that option. The disk isn't initialized if ClickHouse is unable to generate a key by the value of `key_template`. It requires the feature flag [storage_metadata_write_full_object_key](/docs/en/operations/settings/settings#storage_metadata_write_full_object_key) to be enabled. It forbids declaring the `root path` in the `endpoint` option. It requires definition of the option `key_compatibility_prefix`.
+- `key_compatibility_prefix` — That option is required when the option `key_template` is in use. In order to be able to read the object keys which were stored in metadata files with a metadata version lower than `VERSION_FULL_OBJECT_KEY`, the previous `root path` from the `endpoint` option should be set here.
+
+:::note
+Google Cloud Storage (GCS) is also supported using the type `s3`. See [GCS backed MergeTree](/docs/en/integrations/gcs).
+:::
+
+### Using Azure Blob Storage {#azure-blob-storage}
+
+`MergeTree` family table engines can store data to [Azure Blob Storage](https://azure.microsoft.com/en-us/services/storage/blobs/) using a disk with type `azure_blob_storage`.
+
+As of February 2022, this feature is still a fresh addition, so expect that some Azure Blob Storage functionalities might be unimplemented.
+
+Configuration markup:
+``` xml
+<storage_configuration>
+    ...
+    <disks>
+        <blob_storage_disk>
+            <type>azure_blob_storage</type>
+            <storage_account_url>http://account.blob.core.windows.net</storage_account_url>
+            <container_name>container</container_name>
+            <account_name>account</account_name>
+            <account_key>pass123</account_key>
+            <metadata_path>/var/lib/clickhouse/disks/blob_storage_disk/</metadata_path>
+            <cache_path>/var/lib/clickhouse/disks/blob_storage_disk/cache/</cache_path>
+            <skip_access_check>false</skip_access_check>
+        </blob_storage_disk>
+    </disks>
+    ...
+</storage_configuration>
+```
+
+Connection parameters:
+* `storage_account_url` - **Required**, Azure Blob Storage account URL, like `http://account.blob.core.windows.net` or `http://azurite1:10000/devstoreaccount1`.
+* `container_name` - Target container name, defaults to `default-container`.
+* `container_already_exists` - If set to `false`, a new container `container_name` is created in the storage account, if set to `true`, disk connects to the container directly, and if left unset, disk connects to the account, checks if the container `container_name` exists, and creates it if it doesn't exist yet.
+
+Authentication parameters (the disk will try all available methods **and** Managed Identity Credential):
+* `connection_string` - For authentication using a connection string.
+* `account_name` and `account_key` - For authentication using Shared Key.
+
+Limit parameters (mainly for internal usage):
+* `s3_max_single_part_upload_size` - Limits the size of a single block upload to Blob Storage.
+* `min_bytes_for_seek` - Limits the size of a seekable region.
+* `max_single_read_retries` - Limits the number of attempts to read a chunk of data from Blob Storage.
+* `max_single_download_retries` - Limits the number of attempts to download a readable buffer from Blob Storage.
+* `thread_pool_size` - Limits the number of threads with which `IDiskRemote` is instantiated.
+* `s3_max_inflight_parts_for_one_file` - Limits the number of put requests that can be run concurrently for one object.
+
+Other parameters:
+* `metadata_path` - Path on local FS to store metadata files for Blob Storage. Default value is `/var/lib/clickhouse/disks/<disk_name>/`.
+* `skip_access_check` - If true, disk access checks will not be performed on disk start-up. Default value is `false`.
+* `read_resource` — Resource name to be used for [scheduling](/docs/en/operations/workload-scheduling.md) of read requests to this disk. Default value is empty string (IO scheduling is not enabled for this disk).
+* `write_resource` — Resource name to be used for [scheduling](/docs/en/operations/workload-scheduling.md) of write requests to this disk. Default value is empty string (IO scheduling is not enabled for this disk).
+
+Examples of working configurations can be found in integration tests directory (see e.g. [test_merge_tree_azure_blob_storage](https://github.com/ClickHouse/ClickHouse/blob/master/tests/integration/test_merge_tree_azure_blob_storage/configs/config.d/storage_conf.xml) or [test_azure_blob_storage_zero_copy_replication](https://github.com/ClickHouse/ClickHouse/blob/master/tests/integration/test_azure_blob_storage_zero_copy_replication/configs/config.d/storage_conf.xml)).
+
+:::note Zero-copy replication is not ready for production
+Zero-copy replication is disabled by default in ClickHouse version 22.8 and higher. This feature is not recommended for production use.
+:::
+
+## Using HDFS storage {#hdfs-storage}
+
+In this sample configuration:
+- the disk is of type `hdfs`
+- the data is hosted at `hdfs://hdfs1:9000/clickhouse/`
+
+```xml
+<clickhouse>
+    <storage_configuration>
+        <disks>
+            <hdfs>
+                <type>hdfs</type>
+                <endpoint>hdfs://hdfs1:9000/clickhouse/</endpoint>
+                <skip_access_check>true</skip_access_check>
+            </hdfs>
+            <hdd>
+                <type>local</type>
+                <path>/</path>
+            </hdd>
+        </disks>
+        <policies>
+            <hdfs>
+                <volumes>
+                    <main>
+                        <disk>hdfs</disk>
+                    </main>
+                    <external>
+                        <disk>hdd</disk>
+                    </external>
+                </volumes>
+            </hdfs>
+        </policies>
+    </storage_configuration>
+</clickhouse>
``` -is equal to -``` xml - - object_storage - s3 - plain - https://s3.eu-west-1.amazonaws.com/clickhouse-eu-west-1.clickhouse.com/data/ - 1 - -``` - -For details configuration options of each storage see [MergeTree](/docs/en/engines/table-engines/mergetree-family/mergetree.md). - -## Using Virtual File System for Data Encryption {#encrypted-virtual-file-system} +### Using Data Encryption {#encrypted-virtual-file-system} You can encrypt the data stored on [S3](/docs/en/engines/table-engines/mergetree-family/mergetree.md/#table_engine-mergetree-s3), or [HDFS](#configuring-hdfs) external disks, or on a local disk. To turn on the encryption mode, in the configuration file you must define a disk with the type `encrypted` and choose a disk on which the data will be saved. An `encrypted` disk ciphers all written files on the fly, and when you read files from an `encrypted` disk it deciphers them automatically. So you can work with an `encrypted` disk like with a normal one. @@ -230,7 +454,7 @@ Example of disk configuration:
```
 
-## Using local cache {#using-local-cache}
+### Using local cache {#using-local-cache}
 
 It is possible to configure local cache over disks in storage configuration starting from version 22.3. For versions 22.3 - 22.7 cache is supported only for `s3` disk type. For versions >= 22.8 cache is supported for any disk type: S3, Azure, Local, Encrypted, etc.
 
@@ -393,7 +617,56 @@ Cache profile events:
 
- `CachedWriteBufferCacheWriteBytes`, `CachedWriteBufferCacheWriteMicroseconds`
 
-## Storing Data on Web Server {#storing-data-on-webserver}
+### Using static Web storage (read-only) {#web-storage}
+
+Web storage can be used for read-only purposes. An example use is for hosting sample
+data, or for migrating data.
+
+:::tip
+Storage can also be configured temporarily within a query, if a web dataset is not expected
+to be used routinely, see [dynamic storage](#dynamic-storage) and skip editing the
+configuration file.
+:::
+
+In this sample configuration:
+- the disk is of type `web`
+- the data is hosted at `http://nginx:80/test1/`
+- a cache on local storage is used
+
+```xml
+<clickhouse>
+    <storage_configuration>
+        <disks>
+            <web>
+                <type>web</type>
+                <endpoint>http://nginx:80/test1/</endpoint>
+            </web>
+            <cached_web>
+                <type>cache</type>
+                <disk>web</disk>
+                <path>cached_web_cache/</path>
+                <max_size>100000000</max_size>
+            </cached_web>
+        </disks>
+        <policies>
+            <web>
+                <volumes>
+                    <main>
+                        <disk>web</disk>
+                    </main>
+                </volumes>
+            </web>
+            <cached_web>
+                <volumes>
+                    <main>
+                        <disk>cached_web</disk>
+                    </main>
+                </volumes>
+            </cached_web>
+        </policies>
+    </storage_configuration>
+</clickhouse>
+``` There is a tool `clickhouse-static-files-uploader`, which prepares a data directory for a given table (`SELECT data_paths FROM system.tables WHERE name = 'table_name'`). For each table you need, you get a directory of files. These files can be uploaded to, for example, a web server with static files. After this preparation, you can load this table into any ClickHouse server via `DiskWeb`. @@ -595,7 +868,7 @@ If URL is not reachable on disk load when the server is starting up tables, then Use [http_max_single_read_retries](/docs/en/operations/settings/settings.md/#http-max-single-read-retries) setting to limit the maximum number of retries during a single HTTP read. -## Zero-copy Replication (not ready for production) {#zero-copy} +### Zero-copy Replication (not ready for production) {#zero-copy} Zero-copy replication is possible, but not recommended, with `S3` and `HDFS` disks. Zero-copy replication means that if the data is stored remotely on several machines and needs to be synchronized, then only the metadata is replicated (paths to the data parts), but not the data itself. From 5ae410e6339fe52e33b41bbc9c6c115ac6293f57 Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 15 Feb 2024 18:33:38 +0100 Subject: [PATCH 027/985] A bit more explanation --- .../mergetree-family/mergetree.md | 49 +------------------ docs/en/operations/storing-data.md | 44 ++++++++++++++++- 2 files changed, 44 insertions(+), 49 deletions(-) diff --git a/docs/en/engines/table-engines/mergetree-family/mergetree.md b/docs/en/engines/table-engines/mergetree-family/mergetree.md index 0fff13c906f..f23b251f3a1 100644 --- a/docs/en/engines/table-engines/mergetree-family/mergetree.md +++ b/docs/en/engines/table-engines/mergetree-family/mergetree.md @@ -940,53 +940,6 @@ You could change storage policy after table creation with [ALTER TABLE ... MODIF The number of threads performing background moves of data parts can be changed by [background_move_pool_size](/docs/en/operations/server-configuration-parameters/settings.md/#background_move_pool_size) setting. -### Dynamic Storage - -This example query shows how to attach a table stored at a URL and configure the -remote storage within the query. The web storage is not configured in the ClickHouse -configuration files; all the settings are in the CREATE/ATTACH query. - -:::note -The example uses `type=web`, but any disk type can be configured as dynamic, even Local disk. Local disks require a path argument to be inside the server config parameter `custom_local_disks_base_directory`, which has no default, so set that also when using local disk. -::: - -#### Example dynamic web storage - -:::tip -A [demo dataset](https://github.com/ClickHouse/web-tables-demo) is hosted in GitHub. To prepare your own tables for web storage see the tool [clickhouse-static-files-uploader](/docs/en/operations/storing-data.md/#storing-data-on-webserver) -::: - -In this `ATTACH TABLE` query the `UUID` provided matches the directory name of the data, and the endpoint is the URL for the raw GitHub content. 
- -```sql -# highlight-next-line -ATTACH TABLE uk_price_paid UUID 'cf712b4f-2ca8-435c-ac23-c4393efe52f7' -( - price UInt32, - date Date, - postcode1 LowCardinality(String), - postcode2 LowCardinality(String), - type Enum8('other' = 0, 'terraced' = 1, 'semi-detached' = 2, 'detached' = 3, 'flat' = 4), - is_new UInt8, - duration Enum8('unknown' = 0, 'freehold' = 1, 'leasehold' = 2), - addr1 String, - addr2 String, - street LowCardinality(String), - locality LowCardinality(String), - town LowCardinality(String), - district LowCardinality(String), - county LowCardinality(String) -) -ENGINE = MergeTree -ORDER BY (postcode1, postcode2, addr1, addr2) - # highlight-start - SETTINGS disk = disk( - type=web, - endpoint='https://raw.githubusercontent.com/ClickHouse/web-tables-demo/main/web/' - ); - # highlight-end -``` - ### Details {#details} In the case of `MergeTree` tables, data is getting to disk in different ways: @@ -1025,7 +978,7 @@ Configuration markup: ``` xml ... -e + s3 true diff --git a/docs/en/operations/storing-data.md b/docs/en/operations/storing-data.md index baf4e1999a7..0f818b813bf 100644 --- a/docs/en/operations/storing-data.md +++ b/docs/en/operations/storing-data.md @@ -213,6 +213,10 @@ ORDER BY (postcode1, postcode2, addr1, addr2) In the settings highlighted below notice that the disk of `type=web` is nested within the disk of `type=cache`. +:::note +The example uses `type=web`, but any disk type can be configured as dynamic, even Local disk. Local disks require a path argument to be inside the server config parameter `custom_local_disks_base_directory`, which has no default, so set that also when using local disk. +::: + A combination of config-based configuration and sql-defined configuration is also possible: ```sql @@ -302,6 +306,11 @@ Optional parameters: Google Cloud Storage (GCS) is also supported using the type `s3`. See [GCS backed MergeTree](/docs/en/integrations/gcs). ::: +### Using Plain Storage {#s3-storage} + +There is a disk type `s3_plain`, which provides a write-once storage. Unlike `s3` disk type, it stores data as is, e.g. instead of randomly-generated blob names, it uses normal file names as clickhouse stores files on local disk. So this disk type allows to keeper a static version of the table and can also be used to create backups on it. +Configuration parameters are the same as for `s3` disk type. + ### Using Azure Blob Storage {#azure-blob-storage} `MergeTree` family table engines can store data to [Azure Blob Storage](https://azure.microsoft.com/en-us/services/storage/blobs/) using a disk with type `azure_blob_storage`. @@ -672,7 +681,40 @@ There is a tool `clickhouse-static-files-uploader`, which prepares a data direct This is a read-only disk. Its data is only read and never modified. A new table is loaded to this disk via `ATTACH TABLE` query (see example below). Local disk is not actually used, each `SELECT` query will result in a `http` request to fetch required data. All modification of the table data will result in an exception, i.e. the following types of queries are not allowed: [CREATE TABLE](/docs/en/sql-reference/statements/create/table.md), [ALTER TABLE](/docs/en/sql-reference/statements/alter/index.md), [RENAME TABLE](/docs/en/sql-reference/statements/rename.md/#misc_operations-rename_table), [DETACH TABLE](/docs/en/sql-reference/statements/detach.md) and [TRUNCATE TABLE](/docs/en/sql-reference/statements/truncate.md). 
-Web server storage is supported only for the [MergeTree](/docs/en/engines/table-engines/mergetree-family/mergetree.md) and [Log](/docs/en/engines/table-engines/log-family/log.md) engine families. To access the data stored on a `web` disk, use the [storage_policy](/docs/en/engines/table-engines/mergetree-family/mergetree.md/#terms) setting when executing the query. For example, `ATTACH TABLE table_web UUID '{}' (id Int32) ENGINE = MergeTree() ORDER BY id SETTINGS storage_policy = 'web'`. +:::tip +A [demo dataset](https://github.com/ClickHouse/web-tables-demo) is hosted in GitHub. To prepare your own tables for web storage see the tool [clickhouse-static-files-uploader](/docs/en/operations/storing-data.md/#storing-data-on-webserver) +::: + +In this `ATTACH TABLE` query the `UUID` provided matches the directory name of the data, and the endpoint is the URL for the raw GitHub content. + +```sql +# highlight-next-line +ATTACH TABLE uk_price_paid UUID 'cf712b4f-2ca8-435c-ac23-c4393efe52f7' +( + price UInt32, + date Date, + postcode1 LowCardinality(String), + postcode2 LowCardinality(String), + type Enum8('other' = 0, 'terraced' = 1, 'semi-detached' = 2, 'detached' = 3, 'flat' = 4), + is_new UInt8, + duration Enum8('unknown' = 0, 'freehold' = 1, 'leasehold' = 2), + addr1 String, + addr2 String, + street LowCardinality(String), + locality LowCardinality(String), + town LowCardinality(String), + district LowCardinality(String), + county LowCardinality(String) +) +ENGINE = MergeTree +ORDER BY (postcode1, postcode2, addr1, addr2) + # highlight-start + SETTINGS disk = disk( + type=web, + endpoint='https://raw.githubusercontent.com/ClickHouse/web-tables-demo/main/web/' + ); + # highlight-end +``` A ready test case. You need to add this configuration to config: From 09e630e02be9ccd19681b34f33e24cea849ca9fd Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Thu, 15 Feb 2024 19:00:08 +0100 Subject: [PATCH 028/985] Update storing-data.md --- docs/en/operations/storing-data.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/en/operations/storing-data.md b/docs/en/operations/storing-data.md index 0f818b813bf..60e33fe2849 100644 --- a/docs/en/operations/storing-data.md +++ b/docs/en/operations/storing-data.md @@ -10,7 +10,7 @@ Data, processed in ClickHouse, is usually stored in the local file system — on 2. The Hadoop Distributed File System ([HDFS](https://hadoop.apache.org/docs/current/hadoop-project-dist/hadoop-hdfs/HdfsDesign.html)) 3. [Azure Blob Storage](https://azure.microsoft.com/en-us/products/storage/blobs). -Note: to work with data stored on `Amazon S3` disks use [S3](/docs/en/engines/table-engines/integrations/s3.md) table engine, to work with data in the Hadoop Distributed File System — [HDFS](/docs/en/engines/table-engines/integrations/hdfs.md) table engine, and to work with data stored in Azure Blob Storage use [AzureBlobStorage](/docs/en/engines/table-engines/integrations/AzureBlobStorage.md) table engine. They are different from external storage described on this page as they allow to read data stored in some general file format (like Parquet), while on this page we are describing storage configuration for ClickHouse `MergeTree` famility or `Log` family tables. 
+Note: to work with data stored on `Amazon S3` disks use [S3](/docs/en/engines/table-engines/integrations/s3.md) table engine, to work with data in the Hadoop Distributed File System — [HDFS](/docs/en/engines/table-engines/integrations/hdfs.md) table engine, and to work with data stored in Azure Blob Storage use [AzureBlobStorage](/docs/en/engines/table-engines/integrations/AzureBlobStorage.md) table engine. They are different from external storage described on this page as they allow to read data stored in some general file format (like Parquet), while on this page we are describing storage configuration for ClickHouse `MergeTree` family or `Log` family tables. ## Configuring external storage {#configuring-external-storage} From 7bf42fd86e9599357282f947312c98d2bec1047f Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Fri, 16 Feb 2024 11:16:14 +0100 Subject: [PATCH 029/985] Fix upgrade check --- src/Core/SettingsChangesHistory.h | 3 ++- src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp | 2 +- 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/src/Core/SettingsChangesHistory.h b/src/Core/SettingsChangesHistory.h index c453dd837eb..b6d07d7057a 100644 --- a/src/Core/SettingsChangesHistory.h +++ b/src/Core/SettingsChangesHistory.h @@ -93,7 +93,8 @@ static std::map sett {"async_insert_busy_timeout_decrease_rate", 0.2, 0.2, "The exponential growth rate at which the adaptive asynchronous insert timeout decreases"}, {"split_parts_ranges_into_intersecting_and_non_intersecting_final", true, true, "Allow to split parts ranges into intersecting and non intersecting during FINAL optimization"}, {"split_intersecting_parts_ranges_into_layers_final", true, true, "Allow to split intersecting parts ranges into layers during FINAL optimization"}, - {"azure_max_single_part_copy_size", 256*1024*1024, 256*1024*1024, "The maximum size of object to copy using single part copy to Azure blob storage."}}}, + {"azure_max_single_part_copy_size", 256*1024*1024, 256*1024*1024, "The maximum size of object to copy using single part copy to Azure blob storage."}, + {"azure_max_inflight_parts_for_one_file", 20, 20, "The maximum number of a concurrent loaded parts in multipart upload request. 
0 means unlimited."}}}, {"24.1", {{"print_pretty_type_names", false, true, "Better user experience."}, {"input_format_json_read_bools_as_strings", false, true, "Allow to read bools as strings in JSON formats by default"}, {"output_format_arrow_use_signed_indexes_for_dictionary", false, true, "Use signed indexes type for Arrow dictionaries by default as it's recommended"}, diff --git a/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp b/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp index d700090303a..74a8949b235 100644 --- a/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp +++ b/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp @@ -98,7 +98,7 @@ void WriteBufferFromAzureBlobStorage::finalizeImpl() auto block_blob_client = blob_container_client->GetBlockBlobClient(blob_path); execWithRetry([&](){ block_blob_client.CommitBlockList(block_ids); }, max_unexpected_write_error_retries); - LOG_DEBUG(log, "Committed {} blocks for blob `{}`", block_ids.size(), blob_path); + LOG_TRACE(log, "Committed {} blocks for blob `{}`", block_ids.size(), blob_path); } void WriteBufferFromAzureBlobStorage::nextImpl() From a11e67d4aae4433dd0f3d8ee46ba40e1cd73fdd5 Mon Sep 17 00:00:00 2001 From: Alexander Sapin Date: Fri, 16 Feb 2024 16:41:58 +0100 Subject: [PATCH 030/985] Make max_insert_delayed_streams_for_parallel_write actually work --- src/Storages/MergeTree/ReplicatedMergeTreeSink.cpp | 3 +++ 1 file changed, 3 insertions(+) diff --git a/src/Storages/MergeTree/ReplicatedMergeTreeSink.cpp b/src/Storages/MergeTree/ReplicatedMergeTreeSink.cpp index 1fb2393948a..f5494e56049 100644 --- a/src/Storages/MergeTree/ReplicatedMergeTreeSink.cpp +++ b/src/Storages/MergeTree/ReplicatedMergeTreeSink.cpp @@ -323,6 +323,9 @@ void ReplicatedMergeTreeSinkImpl::consume(Chunk chunk) if (!temp_part.part) continue; + if (!support_parallel_write && temp_part.part->getDataPartStorage().supportParallelWrite()) + support_parallel_write = true; + BlockIDsType block_id; if constexpr (async_insert) From 458793cc50b92361848c91803d07105a91acea85 Mon Sep 17 00:00:00 2001 From: Alexander Sapin Date: Fri, 16 Feb 2024 17:13:37 +0100 Subject: [PATCH 031/985] Review fix --- src/Storages/MergeTree/MergeTreeSink.cpp | 9 +++++++-- 1 file changed, 7 insertions(+), 2 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreeSink.cpp b/src/Storages/MergeTree/MergeTreeSink.cpp index 36816904a81..ebc49e22d03 100644 --- a/src/Storages/MergeTree/MergeTreeSink.cpp +++ b/src/Storages/MergeTree/MergeTreeSink.cpp @@ -109,9 +109,14 @@ void MergeTreeSink::consume(Chunk chunk) } } - size_t max_insert_delayed_streams_for_parallel_write = DEFAULT_DELAYED_STREAMS_FOR_PARALLEL_WRITE; - if (!support_parallel_write || settings.max_insert_delayed_streams_for_parallel_write.changed) + size_t max_insert_delayed_streams_for_parallel_write; + + if (settings.max_insert_delayed_streams_for_parallel_write.changed) max_insert_delayed_streams_for_parallel_write = settings.max_insert_delayed_streams_for_parallel_write; + else if (support_parallel_write) + max_insert_delayed_streams_for_parallel_write = DEFAULT_DELAYED_STREAMS_FOR_PARALLEL_WRITE; + else + max_insert_delayed_streams_for_parallel_write = 0; /// In case of too much columns/parts in block, flush explicitly. 
streams += temp_part.streams.size(); From f7b524465c60b15c85f579ca22c48d4c165bf6f2 Mon Sep 17 00:00:00 2001 From: Alexander Sapin Date: Fri, 16 Feb 2024 17:14:36 +0100 Subject: [PATCH 032/985] Followup --- src/Storages/MergeTree/ReplicatedMergeTreeSink.cpp | 8 ++++++-- 1 file changed, 6 insertions(+), 2 deletions(-) diff --git a/src/Storages/MergeTree/ReplicatedMergeTreeSink.cpp b/src/Storages/MergeTree/ReplicatedMergeTreeSink.cpp index f5494e56049..3cbdcf5106e 100644 --- a/src/Storages/MergeTree/ReplicatedMergeTreeSink.cpp +++ b/src/Storages/MergeTree/ReplicatedMergeTreeSink.cpp @@ -368,9 +368,13 @@ void ReplicatedMergeTreeSinkImpl::consume(Chunk chunk) profile_events_scope.reset(); UInt64 elapsed_ns = watch.elapsed(); - size_t max_insert_delayed_streams_for_parallel_write = DEFAULT_DELAYED_STREAMS_FOR_PARALLEL_WRITE; - if (!support_parallel_write || settings.max_insert_delayed_streams_for_parallel_write.changed) + size_t max_insert_delayed_streams_for_parallel_write; + if (settings.max_insert_delayed_streams_for_parallel_write.changed) max_insert_delayed_streams_for_parallel_write = settings.max_insert_delayed_streams_for_parallel_write; + else if (support_parallel_write) + max_insert_delayed_streams_for_parallel_write = DEFAULT_DELAYED_STREAMS_FOR_PARALLEL_WRITE; + else + max_insert_delayed_streams_for_parallel_write = 0; /// In case of too much columns/parts in block, flush explicitly. streams += temp_part.streams.size(); From 1549725eddb6db299ba0297de21a51411607d2a3 Mon Sep 17 00:00:00 2001 From: unashi Date: Sun, 18 Feb 2024 19:26:12 +0800 Subject: [PATCH 033/985] [feature]: allow to attach parts from a different disk --- src/Storages/MergeTree/MergeTreeData.cpp | 13 ++ src/Storages/MergeTree/MergeTreeData.h | 9 + .../MergeTree/MergeTreeDataPartCloner.cpp | 70 ++++++- src/Storages/StorageMergeTree.cpp | 45 +++-- src/Storages/StorageReplicatedMergeTree.cpp | 42 ++-- .../__init__.py | 0 .../configs/remote_servers.xml | 17 ++ .../test_attach_partition_using_copy/test.py | 183 ++++++++++++++++++ 8 files changed, 353 insertions(+), 26 deletions(-) create mode 100644 tests/integration/test_attach_partition_using_copy/__init__.py create mode 100644 tests/integration/test_attach_partition_using_copy/configs/remote_servers.xml create mode 100644 tests/integration/test_attach_partition_using_copy/test.py diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index 3ca746a7197..56710b157de 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -7085,6 +7085,19 @@ std::pair MergeTreeData::cloneAn this, src_part, metadata_snapshot, dst_part_info, tmp_part_prefix, require_part_metadata, params, read_settings, write_settings); } +std::pair MergeTreeData::cloneAndLoadDataPartOnOtherDisk( + const MergeTreeData::DataPartPtr & src_part, + const String & tmp_part_prefix, + const MergeTreePartInfo & dst_part_info, + const StorageMetadataPtr & metadata_snapshot, + const IDataPartStorage::ClonePartParams & params, + const ReadSettings & read_settings, + const WriteSettings & write_settings) +{ + return MergeTreeDataPartCloner::clone( + this, src_part, metadata_snapshot, dst_part_info, tmp_part_prefix, require_part_metadata, params, read_settings, write_settings); +} + std::pair MergeTreeData::cloneAndLoadPartOnSameDiskWithDifferentPartitionKey( const MergeTreeData::DataPartPtr & src_part, const MergeTreePartition & new_partition, diff --git a/src/Storages/MergeTree/MergeTreeData.h 
b/src/Storages/MergeTree/MergeTreeData.h index dfdc22baa8f..a24362f68fc 100644 --- a/src/Storages/MergeTree/MergeTreeData.h +++ b/src/Storages/MergeTree/MergeTreeData.h @@ -866,6 +866,15 @@ public: ContextPtr local_context, Int64 min_block, Int64 max_block); + + std::pair cloneAndLoadDataPartOnOtherDisk( + const MergeTreeData::DataPartPtr & src_part, + const String & tmp_part_prefix, + const MergeTreePartInfo & dst_part_info, + const StorageMetadataPtr & metadata_snapshot, + const IDataPartStorage::ClonePartParams & params, + const ReadSettings & read_settings, + const WriteSettings & write_settings); static std::pair createPartitionAndMinMaxIndexFromSourcePart( const MergeTreeData::DataPartPtr & src_part, diff --git a/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp b/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp index 04019d2c665..69b7abacc93 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartCloner.cpp @@ -142,6 +142,30 @@ std::shared_ptr hardlinkAllFiles( params); } +std::shared_ptr cloneAllFiles( + MergeTreeData * merge_tree_data, + const DB::ReadSettings & read_settings, + const DB::WriteSettings & write_settings, + const DataPartStoragePtr & storage, + const String & path) +{ + for (const DiskPtr & disk : merge_tree_data->getStoragePolicy()->getDisks()) + { + try{ + return storage->clonePart( + merge_tree_data->getRelativeDataPath(), + path, + disk, + read_settings, + write_settings,{},{}); + }catch(...) { + LOG_TRACE(&Poco::Logger::get("MergeTreeDataPartCloner"), "Clone part on disk {} fail", disk->getName()); + } + } + LOG_FATAL(&Poco::Logger::get("MergeTreeDataPartCloner"), "Clone part on disks all fail"); + throw; +} + std::pair cloneSourcePart( MergeTreeData * merge_tree_data, const MergeTreeData::DataPartPtr & src_part, @@ -165,8 +189,18 @@ std::pair cloneSourcePart( auto src_part_storage = flushPartStorageToDiskIfInMemory( merge_tree_data, src_part, metadata_snapshot, tmp_part_prefix, tmp_dst_part_name, src_flushed_tmp_dir_lock, src_flushed_tmp_part); - - auto dst_part_storage = hardlinkAllFiles(merge_tree_data, read_settings, write_settings, src_part_storage, tmp_dst_part_name, params); + std::shared_ptr dst_part_storage {}; + if (params.copy_instead_of_hardlink) { + dst_part_storage = cloneAllFiles(merge_tree_data, read_settings, write_settings, src_part_storage, tmp_dst_part_name); + } else { + try{ + dst_part_storage = hardlinkAllFiles(merge_tree_data, read_settings, write_settings, src_part_storage, tmp_dst_part_name, params); + } catch(...){ + // Hard link fail. Try copy. + LOG_WARNING(&Poco::Logger::get("MergeTreeDataPartCloner"), "Hard link fail, try tp copy directly. 
to:{}, path:{}", merge_tree_data->getRelativeDataPath(),tmp_dst_part_name); + dst_part_storage = cloneAllFiles(merge_tree_data, read_settings, write_settings, src_part_storage, tmp_dst_part_name); + } + } if (params.metadata_version_to_write.has_value()) { @@ -275,6 +309,25 @@ std::pair cloneAndHand return std::make_pair(destination_part, std::move(temporary_directory_lock)); } + +std::pair cloneInsteadOfHardlinksAndProjections( + MergeTreeData * merge_tree_data, + const DataPartPtr & src_part, + const StorageMetadataPtr & metadata_snapshot, + const MergeTreePartInfo & dst_part_info, + const String & tmp_part_prefix, + const ReadSettings & read_settings, + const WriteSettings & write_settings, + const IDataPartStorage::ClonePartParams & params) +{ + chassert(!merge_tree_data->isStaticStorage()); + + auto [destination_part, temporary_directory_lock] = cloneSourcePart( + merge_tree_data, src_part, metadata_snapshot, dst_part_info, tmp_part_prefix, read_settings, write_settings, params); + + return std::make_pair(destination_part, std::move(temporary_directory_lock)); +} + } std::pair MergeTreeDataPartCloner::clone( @@ -288,10 +341,19 @@ std::pair MergeTreeDat const ReadSettings & read_settings, const WriteSettings & write_settings) { - auto [destination_part, temporary_directory_lock] = cloneAndHandleHardlinksAndProjections( + if (params.copy_instead_of_hardlink) + { + auto [destination_part, temporary_directory_lock] = cloneInsteadOfHardlinksAndProjections( merge_tree_data, src_part, metadata_snapshot, dst_part_info, tmp_part_prefix, read_settings, write_settings, params); + return std::make_pair(finalizePart(destination_part, params, require_part_metadata), std::move(temporary_directory_lock)); + } + else + { + auto [destination_part, temporary_directory_lock] = cloneAndHandleHardlinksAndProjections( + merge_tree_data, src_part, metadata_snapshot, dst_part_info, tmp_part_prefix, read_settings, write_settings, params); + return std::make_pair(finalizePart(destination_part, params, require_part_metadata), std::move(temporary_directory_lock)); - return std::make_pair(finalizePart(destination_part, params, require_part_metadata), std::move(temporary_directory_lock)); + } } std::pair MergeTreeDataPartCloner::cloneWithDistinctPartitionExpression( diff --git a/src/Storages/StorageMergeTree.cpp b/src/Storages/StorageMergeTree.cpp index 0f75c726bce..0f95fef9c6e 100644 --- a/src/Storages/StorageMergeTree.cpp +++ b/src/Storages/StorageMergeTree.cpp @@ -2118,17 +2118,40 @@ void StorageMergeTree::replacePartitionFrom(const StoragePtr & source_table, con else { MergeTreePartInfo dst_part_info(partition_id, index, index, src_part->info.level); - - auto [dst_part, part_lock] = cloneAndLoadDataPartOnSameDisk( - src_part, - TMP_PREFIX, - dst_part_info, - my_metadata_snapshot, - clone_params, - local_context->getReadSettings(), - local_context->getWriteSettings()); - dst_parts.emplace_back(std::move(dst_part)); - dst_parts_locks.emplace_back(std::move(part_lock)); + LOG_TRACE(log, "Partition exps are the same:part id: {}; number of disks:{}",dst_part_info.partition_id, this->getStoragePolicy()->getDisks().size()); + bool on_same_disk = false; + for (const DiskPtr & disk : this->getStoragePolicy()->getDisks()) + { + if (disk->getName() == src_part->getDataPartStorage().getDiskName()) + on_same_disk = true; + } + if (on_same_disk) + { + auto [dst_part, part_lock] = cloneAndLoadDataPartOnSameDisk( + src_part, + TMP_PREFIX, + dst_part_info, + my_metadata_snapshot, + clone_params, + 
local_context->getReadSettings(), + local_context->getWriteSettings()); + dst_parts.emplace_back(std::move(dst_part)); + dst_parts_locks.emplace_back(std::move(part_lock)); + } + else + { + clone_params.copy_instead_of_hardlink = true; + auto [dst_part, part_lock] = cloneAndLoadDataPartOnOtherDisk( + src_part, + TMP_PREFIX, + dst_part_info, + my_metadata_snapshot, + clone_params, + local_context->getReadSettings(), + local_context->getWriteSettings()); + dst_parts.emplace_back(std::move(dst_part)); + dst_parts_locks.emplace_back(std::move(part_lock)); + } } } diff --git a/src/Storages/StorageReplicatedMergeTree.cpp b/src/Storages/StorageReplicatedMergeTree.cpp index 6bd57cc4d6d..ba0d27fe612 100644 --- a/src/Storages/StorageReplicatedMergeTree.cpp +++ b/src/Storages/StorageReplicatedMergeTree.cpp @@ -8015,17 +8015,37 @@ void StorageReplicatedMergeTree::replacePartitionFrom( { MergeTreePartInfo dst_part_info(partition_id, index, index, src_part->info.level); - auto [dst_part, part_lock] = cloneAndLoadDataPartOnSameDisk( - src_part, - TMP_PREFIX, - dst_part_info, - metadata_snapshot, - clone_params, - query_context->getReadSettings(), - query_context->getWriteSettings()); - - dst_parts.emplace_back(dst_part); - dst_parts_locks.emplace_back(std::move(part_lock)); + bool on_same_disk = false; + for (const DiskPtr & disk : this->getStoragePolicy()->getDisks()) + if (disk->getName() == src_part->getDataPartStorage().getDiskName()) + on_same_disk = true; + if (on_same_disk) + { + auto [dst_part, part_lock] = cloneAndLoadDataPartOnSameDisk( + src_part, + TMP_PREFIX, + dst_part_info, + metadata_snapshot, + clone_params, + query_context->getReadSettings(), + query_context->getWriteSettings()); + dst_parts.emplace_back(dst_part); + dst_parts_locks.emplace_back(std::move(part_lock)); + } + else + { + clone_params.copy_instead_of_hardlink = true; + auto [dst_part, part_lock] = cloneAndLoadDataPartOnOtherDisk( + src_part, + TMP_PREFIX, + dst_part_info, + metadata_snapshot, + clone_params, + query_context->getReadSettings(), + query_context->getWriteSettings()); + dst_parts.emplace_back(dst_part); + dst_parts_locks.emplace_back(std::move(part_lock)); + } } src_parts.emplace_back(src_part); diff --git a/tests/integration/test_attach_partition_using_copy/__init__.py b/tests/integration/test_attach_partition_using_copy/__init__.py new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/integration/test_attach_partition_using_copy/configs/remote_servers.xml b/tests/integration/test_attach_partition_using_copy/configs/remote_servers.xml new file mode 100644 index 00000000000..b40730e9f7d --- /dev/null +++ b/tests/integration/test_attach_partition_using_copy/configs/remote_servers.xml @@ -0,0 +1,17 @@ + + + + + true + + replica1 + 9000 + + + replica2 + 9000 + + + + + diff --git a/tests/integration/test_attach_partition_using_copy/test.py b/tests/integration/test_attach_partition_using_copy/test.py new file mode 100644 index 00000000000..effb5708cf3 --- /dev/null +++ b/tests/integration/test_attach_partition_using_copy/test.py @@ -0,0 +1,183 @@ +import pytest +from helpers.cluster import ClickHouseCluster +from helpers.test_tools import assert_eq_with_retry + +cluster = ClickHouseCluster(__file__) + +replica1 = cluster.add_instance( + "replica1", with_zookeeper=True, main_configs=["configs/remote_servers.xml"] +) +replica2 = cluster.add_instance( + "replica2", with_zookeeper=True, main_configs=["configs/remote_servers.xml"] +) + + +@pytest.fixture(scope="module") +def start_cluster(): + try: + 
cluster.start() + yield cluster + except Exception as ex: + print(ex) + finally: + cluster.shutdown() + + +def cleanup(nodes): + for node in nodes: + node.query("DROP TABLE IF EXISTS source SYNC") + node.query("DROP TABLE IF EXISTS destination SYNC") + + +def create_source_table(node, table_name, replicated): + replica = node.name + engine = ( + f"ReplicatedMergeTree('/clickhouse/tables/1/{table_name}', '{replica}')" + if replicated + else "MergeTree()" + ) + node.query_with_retry( + """ + ATTACH TABLE {table_name} UUID 'cf712b4f-2ca8-435c-ac23-c4393efe52f7' + ( + price UInt32, + date Date, + postcode1 LowCardinality(String), + postcode2 LowCardinality(String), + type Enum8('other' = 0, 'terraced' = 1, 'semi-detached' = 2, 'detached' = 3, 'flat' = 4), + is_new UInt8, + duration Enum8('unknown' = 0, 'freehold' = 1, 'leasehold' = 2), + addr1 String, + addr2 String, + street LowCardinality(String), + locality LowCardinality(String), + town LowCardinality(String), + district LowCardinality(String), + county LowCardinality(String) + ) + ENGINE = {engine} + ORDER BY (postcode1, postcode2, addr1, addr2) + SETTINGS disk = disk(type = web, endpoint = 'https://raw.githubusercontent.com/ClickHouse/web-tables-demo/main/web/') + """.format( + table_name=table_name, + engine=engine + ) + ) + + + +def create_destination_table(node, table_name, replicated): + replica = node.name + engine = ( + f"ReplicatedMergeTree('/clickhouse/tables/1/{table_name}', '{replica}')" + if replicated + else "MergeTree()" + ) + node.query_with_retry( + """ + CREATE TABLE {table_name} + ( + price UInt32, + date Date, + postcode1 LowCardinality(String), + postcode2 LowCardinality(String), + type Enum8('other' = 0, 'terraced' = 1, 'semi-detached' = 2, 'detached' = 3, 'flat' = 4), + is_new UInt8, + duration Enum8('unknown' = 0, 'freehold' = 1, 'leasehold' = 2), + addr1 String, + addr2 String, + street LowCardinality(String), + locality LowCardinality(String), + town LowCardinality(String), + district LowCardinality(String), + county LowCardinality(String) + ) + ENGINE = {engine} + ORDER BY (postcode1, postcode2, addr1, addr2) + """.format( + table_name=table_name, + engine=engine + ) + ) + +def test_both_mergtree(start_cluster): + create_source_table(replica1, "source", False) + create_destination_table(replica1, "destination", False) + + replica1.query( + f"ALTER TABLE destination ATTACH PARTITION tuple() FROM source" + ) + + assert_eq_with_retry( + replica1, f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM destination GROUP BY year ORDER BY year ASC", + replica1.query(f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM source GROUP BY year ORDER BY year ASC"), + ) + + assert_eq_with_retry( + replica1, f"SELECT town from destination LIMIT 1", + "SCARBOROUGH" + ) + + cleanup([replica1]) + +def test_all_replicated(start_cluster): + create_source_table(replica1, "source", True) + create_destination_table(replica1, "destination", True) + create_destination_table(replica2, "destination", True) + + replica1.query("SYSTEM SYNC REPLICA destination") + replica1.query( + f"ALTER TABLE destination ATTACH PARTITION tuple() FROM source" + ) + + assert_eq_with_retry( + replica1, f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM destination GROUP BY year ORDER BY year ASC", + replica1.query(f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM source GROUP BY year ORDER BY year ASC"), + ) + 
assert_eq_with_retry( + replica1, f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM source GROUP BY year ORDER BY year ASC", + replica2.query(f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM destination GROUP BY year ORDER BY year ASC"), + ) + + assert_eq_with_retry( + replica1, f"SELECT town from destination LIMIT 1", + "SCARBOROUGH" + ) + + assert_eq_with_retry( + replica2, f"SELECT town from destination LIMIT 1", + "SCARBOROUGH" + ) + + cleanup([replica1, replica2]) + +def test_only_destination_replicated(start_cluster): + create_source_table(replica1, "source", False) + create_destination_table(replica1, "destination", True) + create_destination_table(replica2, "destination", True) + + replica1.query("SYSTEM SYNC REPLICA destination") + replica1.query( + f"ALTER TABLE destination ATTACH PARTITION tuple() FROM source" + ) + + assert_eq_with_retry( + replica1, f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM destination GROUP BY year ORDER BY year ASC", + replica1.query(f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM source GROUP BY year ORDER BY year ASC"), + ) + assert_eq_with_retry( + replica1, f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM source GROUP BY year ORDER BY year ASC", + replica2.query(f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM destination GROUP BY year ORDER BY year ASC"), + ) + + assert_eq_with_retry( + replica1, f"SELECT town from destination LIMIT 1", + "SCARBOROUGH" + ) + + assert_eq_with_retry( + replica2, f"SELECT town from destination LIMIT 1", + "SCARBOROUGH" + ) + + cleanup([replica1, replica2]) From 8c11f59ba82bd9ae3a322f7a9729c4a5a8644512 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Mon, 19 Feb 2024 11:01:37 +0100 Subject: [PATCH 034/985] Fix bad link, update disk web description --- docs/en/operations/storing-data.md | 19 ++++++++----------- 1 file changed, 8 insertions(+), 11 deletions(-) diff --git a/docs/en/operations/storing-data.md b/docs/en/operations/storing-data.md index 60e33fe2849..4b0345a3206 100644 --- a/docs/en/operations/storing-data.md +++ b/docs/en/operations/storing-data.md @@ -628,14 +628,9 @@ Cache profile events: ### Using static Web storage (read-only) {#web-storage} -Web storage can be used for read-only purposes. An example use is for hosting sample -data, or for migrating data. - -:::tip -Storage can also be configured temporarily within a query, if a web dataset is not expected -to be used routinely, see [dynamic storage](#dynamic-storage) and skip editing the -configuration file. -::: +This is a read-only disk. Its data is only read and never modified. A new table is loaded to this disk via `ATTACH TABLE` query (see example below). Local disk is not actually used, each `SELECT` query will result in a `http` request to fetch required data. All modification of the table data will result in an exception, i.e. the following types of queries are not allowed: [CREATE TABLE](/docs/en/sql-reference/statements/create/table.md), [ALTER TABLE](/docs/en/sql-reference/statements/alter/index.md), [RENAME TABLE](/docs/en/sql-reference/statements/rename.md/#misc_operations-rename_table), [DETACH TABLE](/docs/en/sql-reference/statements/detach.md) and [TRUNCATE TABLE](/docs/en/sql-reference/statements/truncate.md). 
+Web storage can be used for read-only purposes. An example use is for hosting sample data, or for migrating data. +There is a tool `clickhouse-static-files-uploader`, which prepares a data directory for a given table (`SELECT data_paths FROM system.tables WHERE name = 'table_name'`). For each table you need, you get a directory of files. These files can be uploaded to, for example, a web server with static files. After this preparation, you can load this table into any ClickHouse server via `DiskWeb`. In this sample configuration: - the disk is of type `web` @@ -677,9 +672,11 @@ In this sample configuration:
``` -There is a tool `clickhouse-static-files-uploader`, which prepares a data directory for a given table (`SELECT data_paths FROM system.tables WHERE name = 'table_name'`). For each table you need, you get a directory of files. These files can be uploaded to, for example, a web server with static files. After this preparation, you can load this table into any ClickHouse server via `DiskWeb`. - -This is a read-only disk. Its data is only read and never modified. A new table is loaded to this disk via `ATTACH TABLE` query (see example below). Local disk is not actually used, each `SELECT` query will result in a `http` request to fetch required data. All modification of the table data will result in an exception, i.e. the following types of queries are not allowed: [CREATE TABLE](/docs/en/sql-reference/statements/create/table.md), [ALTER TABLE](/docs/en/sql-reference/statements/alter/index.md), [RENAME TABLE](/docs/en/sql-reference/statements/rename.md/#misc_operations-rename_table), [DETACH TABLE](/docs/en/sql-reference/statements/detach.md) and [TRUNCATE TABLE](/docs/en/sql-reference/statements/truncate.md). +:::tip +Storage can also be configured temporarily within a query, if a web dataset is not expected +to be used routinely, see [dynamic configuration](#dynamic-configuration) and skip editing the +configuration file. +::: :::tip A [demo dataset](https://github.com/ClickHouse/web-tables-demo) is hosted in GitHub. To prepare your own tables for web storage see the tool [clickhouse-static-files-uploader](/docs/en/operations/storing-data.md/#storing-data-on-webserver) From 601b1dfaa14323db28f169b6b193d59ec75e8bfc Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Mon, 19 Feb 2024 12:21:52 +0100 Subject: [PATCH 035/985] Fix bad link --- docs/en/operations/storing-data.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/en/operations/storing-data.md b/docs/en/operations/storing-data.md index 4b0345a3206..4f676904375 100644 --- a/docs/en/operations/storing-data.md +++ b/docs/en/operations/storing-data.md @@ -10,7 +10,7 @@ Data, processed in ClickHouse, is usually stored in the local file system — on 2. The Hadoop Distributed File System ([HDFS](https://hadoop.apache.org/docs/current/hadoop-project-dist/hadoop-hdfs/HdfsDesign.html)) 3. [Azure Blob Storage](https://azure.microsoft.com/en-us/products/storage/blobs). -Note: to work with data stored on `Amazon S3` disks use [S3](/docs/en/engines/table-engines/integrations/s3.md) table engine, to work with data in the Hadoop Distributed File System — [HDFS](/docs/en/engines/table-engines/integrations/hdfs.md) table engine, and to work with data stored in Azure Blob Storage use [AzureBlobStorage](/docs/en/engines/table-engines/integrations/AzureBlobStorage.md) table engine. They are different from external storage described on this page as they allow to read data stored in some general file format (like Parquet), while on this page we are describing storage configuration for ClickHouse `MergeTree` family or `Log` family tables. +Note: to work with data stored on `Amazon S3` disks use [S3](/docs/en/engines/table-engines/integrations/s3.md) table engine, to work with data in the Hadoop Distributed File System — [HDFS](/docs/en/engines/table-engines/integrations/hdfs.md) table engine, and to work with data stored in Azure Blob Storage use [AzureBlobStorage](/docs/en/engines/table-engines/integrations/azureBlobStorage.md) table engine. 
They are different from external storage described on this page as they allow to read data stored in some general file format (like Parquet), while on this page we are describing storage configuration for ClickHouse `MergeTree` family or `Log` family tables. ## Configuring external storage {#configuring-external-storage} From 80fe3f78d99caeaed733548ca65b6bd466730d51 Mon Sep 17 00:00:00 2001 From: unashi Date: Tue, 20 Feb 2024 11:12:09 +0800 Subject: [PATCH 036/985] [fix] black the python script --- .../test_attach_partition_using_copy/test.py | 92 ++++++++++--------- 1 file changed, 48 insertions(+), 44 deletions(-) diff --git a/tests/integration/test_attach_partition_using_copy/test.py b/tests/integration/test_attach_partition_using_copy/test.py index effb5708cf3..df5378742ae 100644 --- a/tests/integration/test_attach_partition_using_copy/test.py +++ b/tests/integration/test_attach_partition_using_copy/test.py @@ -59,13 +59,11 @@ def create_source_table(node, table_name, replicated): ORDER BY (postcode1, postcode2, addr1, addr2) SETTINGS disk = disk(type = web, endpoint = 'https://raw.githubusercontent.com/ClickHouse/web-tables-demo/main/web/') """.format( - table_name=table_name, - engine=engine + table_name=table_name, engine=engine ) ) - def create_destination_table(node, table_name, replicated): replica = node.name engine = ( @@ -95,89 +93,95 @@ def create_destination_table(node, table_name, replicated): ENGINE = {engine} ORDER BY (postcode1, postcode2, addr1, addr2) """.format( - table_name=table_name, - engine=engine + table_name=table_name, engine=engine ) ) + def test_both_mergtree(start_cluster): create_source_table(replica1, "source", False) create_destination_table(replica1, "destination", False) - replica1.query( - f"ALTER TABLE destination ATTACH PARTITION tuple() FROM source" - ) - + replica1.query(f"ALTER TABLE destination ATTACH PARTITION tuple() FROM source") + assert_eq_with_retry( - replica1, f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM destination GROUP BY year ORDER BY year ASC", - replica1.query(f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM source GROUP BY year ORDER BY year ASC"), + replica1, + f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM destination GROUP BY year ORDER BY year ASC", + replica1.query( + f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM source GROUP BY year ORDER BY year ASC" + ), ) - + assert_eq_with_retry( - replica1, f"SELECT town from destination LIMIT 1", - "SCARBOROUGH" + replica1, f"SELECT town from destination LIMIT 1", "SCARBOROUGH" ) cleanup([replica1]) + def test_all_replicated(start_cluster): create_source_table(replica1, "source", True) create_destination_table(replica1, "destination", True) create_destination_table(replica2, "destination", True) replica1.query("SYSTEM SYNC REPLICA destination") - replica1.query( - f"ALTER TABLE destination ATTACH PARTITION tuple() FROM source" + replica1.query(f"ALTER TABLE destination ATTACH PARTITION tuple() FROM source") + + assert_eq_with_retry( + replica1, + f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM destination GROUP BY year ORDER BY year ASC", + replica1.query( + f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM source GROUP BY year ORDER BY year ASC" + ), + ) + assert_eq_with_retry( + replica1, + f"SELECT toYear(date) AS year,round(avg(price)) 
AS price,bar(price, 0, 1000000, 80) FROM source GROUP BY year ORDER BY year ASC", + replica2.query( + f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM destination GROUP BY year ORDER BY year ASC" + ), ) assert_eq_with_retry( - replica1, f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM destination GROUP BY year ORDER BY year ASC", - replica1.query(f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM source GROUP BY year ORDER BY year ASC"), - ) - assert_eq_with_retry( - replica1, f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM source GROUP BY year ORDER BY year ASC", - replica2.query(f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM destination GROUP BY year ORDER BY year ASC"), + replica1, f"SELECT town from destination LIMIT 1", "SCARBOROUGH" ) assert_eq_with_retry( - replica1, f"SELECT town from destination LIMIT 1", - "SCARBOROUGH" - ) - - assert_eq_with_retry( - replica2, f"SELECT town from destination LIMIT 1", - "SCARBOROUGH" + replica2, f"SELECT town from destination LIMIT 1", "SCARBOROUGH" ) cleanup([replica1, replica2]) + def test_only_destination_replicated(start_cluster): create_source_table(replica1, "source", False) create_destination_table(replica1, "destination", True) create_destination_table(replica2, "destination", True) replica1.query("SYSTEM SYNC REPLICA destination") - replica1.query( - f"ALTER TABLE destination ATTACH PARTITION tuple() FROM source" + replica1.query(f"ALTER TABLE destination ATTACH PARTITION tuple() FROM source") + + assert_eq_with_retry( + replica1, + f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM destination GROUP BY year ORDER BY year ASC", + replica1.query( + f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM source GROUP BY year ORDER BY year ASC" + ), + ) + assert_eq_with_retry( + replica1, + f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM source GROUP BY year ORDER BY year ASC", + replica2.query( + f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM destination GROUP BY year ORDER BY year ASC" + ), ) assert_eq_with_retry( - replica1, f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM destination GROUP BY year ORDER BY year ASC", - replica1.query(f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM source GROUP BY year ORDER BY year ASC"), - ) - assert_eq_with_retry( - replica1, f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM source GROUP BY year ORDER BY year ASC", - replica2.query(f"SELECT toYear(date) AS year,round(avg(price)) AS price,bar(price, 0, 1000000, 80) FROM destination GROUP BY year ORDER BY year ASC"), + replica1, f"SELECT town from destination LIMIT 1", "SCARBOROUGH" ) assert_eq_with_retry( - replica1, f"SELECT town from destination LIMIT 1", - "SCARBOROUGH" - ) - - assert_eq_with_retry( - replica2, f"SELECT town from destination LIMIT 1", - "SCARBOROUGH" + replica2, f"SELECT town from destination LIMIT 1", "SCARBOROUGH" ) cleanup([replica1, replica2]) From 8de4a9dbfd32b7e82764a5c8efff3916b5c7ccda Mon Sep 17 00:00:00 2001 From: unashi Date: Tue, 20 Feb 2024 11:42:40 +0800 Subject: [PATCH 037/985] [fix] delete trailing whitespaces --- src/Storages/MergeTree/MergeTreeData.h 
| 2 +- src/Storages/StorageMergeTree.cpp | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreeData.h b/src/Storages/MergeTree/MergeTreeData.h index 5f387385d38..081087acbaa 100644 --- a/src/Storages/MergeTree/MergeTreeData.h +++ b/src/Storages/MergeTree/MergeTreeData.h @@ -853,7 +853,7 @@ public: const IDataPartStorage::ClonePartParams & params, const ReadSettings & read_settings, const WriteSettings & write_settings); - + std::pair cloneAndLoadDataPartOnOtherDisk( const MergeTreeData::DataPartPtr & src_part, const String & tmp_part_prefix, diff --git a/src/Storages/StorageMergeTree.cpp b/src/Storages/StorageMergeTree.cpp index a2713775e65..47684925182 100644 --- a/src/Storages/StorageMergeTree.cpp +++ b/src/Storages/StorageMergeTree.cpp @@ -2081,7 +2081,7 @@ void StorageMergeTree::replacePartitionFrom(const StoragePtr & source_table, con /// This will generate unique name in scope of current server process. Int64 temp_index = insert_increment.get(); MergeTreePartInfo dst_part_info(partition_id, temp_index, temp_index, src_part->info.level); - + IDataPartStorage::ClonePartParams clone_params{.txn = local_context->getCurrentTransaction()}; LOG_TRACE(log, "Partition exps are the same:part id: {}; number of disks:{}",dst_part_info.partition_id, this->getStoragePolicy()->getDisks().size()); bool on_same_disk = false; From 6437877a712bfaf4a36c180b332a0d6a37981af1 Mon Sep 17 00:00:00 2001 From: unashi Date: Tue, 20 Feb 2024 20:31:59 +0800 Subject: [PATCH 038/985] [fix] add changelog; change some feature logic --- CHANGELOG.md | 1 + src/Storages/MergeTree/MergeTreeData.cpp | 10 +++++++--- src/Storages/StorageMergeTree.cpp | 1 - src/Storages/StorageReplicatedMergeTree.cpp | 3 +-- 4 files changed, 9 insertions(+), 6 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index b3e5dd709ab..fd4ff90f841 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -42,6 +42,7 @@ * Added `FROM ` modifier for `SYSTEM SYNC REPLICA LIGHTWEIGHT` query. With the `FROM` modifier ensures we wait for fetches and drop-ranges only for the specified source replicas, as well as any replica not in zookeeper or with an empty source_replica. [#58393](https://github.com/ClickHouse/ClickHouse/pull/58393) ([Jayme Bird](https://github.com/jaymebrd)). * Added setting `update_insert_deduplication_token_in_dependent_materialized_views`. This setting allows to update insert deduplication token with table identifier during insert in dependent materialized views. Closes [#59165](https://github.com/ClickHouse/ClickHouse/issues/59165). [#59238](https://github.com/ClickHouse/ClickHouse/pull/59238) ([Maksim Kita](https://github.com/kitaisreal)). * Added statement `SYSTEM RELOAD ASYNCHRONOUS METRICS` which updates the asynchronous metrics. Mostly useful for testing and development. [#53710](https://github.com/ClickHouse/ClickHouse/pull/53710) ([Robert Schulze](https://github.com/rschu1ze)). +* Attach parts from a different disk `ALTER TABLE destination ATTACH PARTITION tuple() FROM source` where source is an [instant table](https://github.com/ClickHouse/web-tables-demo). [#60112](https://github.com/ClickHouse/ClickHouse/pull/60112)([Unalian](https://github.com/Unalian)). #### Performance Improvement * Coordination for parallel replicas is rewritten for better parallelism and cache locality. It has been tested for linear scalability on hundreds of replicas. It also got support for reading in order. 
[#57968](https://github.com/ClickHouse/ClickHouse/pull/57968) ([Nikita Taranov](https://github.com/nickitat)). diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index 64787d3509b..be1346e0ea2 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -8,6 +8,7 @@ #include #include #include +#include "Common/logger_useful.h" #include #include #include @@ -7170,7 +7171,9 @@ std::pair MergeTreeData::cloneAn } } if (!copy_successful) - throw; + { + LOG_FATAL(&Poco::Logger::get("MergeTreeData"), "Hard link fail, clone fail"); + } } @@ -7301,8 +7304,9 @@ std::pair MergeTreeData::cloneAn } } if (!copy_successful) - throw; - + { + LOG_FATAL( &Poco::Logger::get("MergeTreeData"), "Hard link fail, clone fail."); + } if (params.metadata_version_to_write.has_value()) { chassert(!params.keep_metadata_version); diff --git a/src/Storages/StorageMergeTree.cpp b/src/Storages/StorageMergeTree.cpp index 47684925182..0748ac2dbdf 100644 --- a/src/Storages/StorageMergeTree.cpp +++ b/src/Storages/StorageMergeTree.cpp @@ -2104,7 +2104,6 @@ void StorageMergeTree::replacePartitionFrom(const StoragePtr & source_table, con } else { - clone_params.copy_instead_of_hardlink = true; auto [dst_part, part_lock] = cloneAndLoadDataPartOnOtherDisk( src_part, TMP_PREFIX, diff --git a/src/Storages/StorageReplicatedMergeTree.cpp b/src/Storages/StorageReplicatedMergeTree.cpp index df261053360..2460d2704c4 100644 --- a/src/Storages/StorageReplicatedMergeTree.cpp +++ b/src/Storages/StorageReplicatedMergeTree.cpp @@ -7933,7 +7933,7 @@ void StorageReplicatedMergeTree::replacePartitionFrom( for (const DiskPtr & disk : this->getStoragePolicy()->getDisks()) if (disk->getName() == src_part->getDataPartStorage().getDiskName()) on_same_disk = true; - if (on_same_disk) + if (on_same_disk && !clone_params.copy_instead_of_hardlink) { auto [dst_part, part_lock] = cloneAndLoadDataPartOnSameDisk( src_part, @@ -7948,7 +7948,6 @@ void StorageReplicatedMergeTree::replacePartitionFrom( } else { - clone_params.copy_instead_of_hardlink = true; auto [dst_part, part_lock] = cloneAndLoadDataPartOnOtherDisk( src_part, TMP_PREFIX, From fc3ebe007b3b5dc905ecbd63ed402547a1cde3a5 Mon Sep 17 00:00:00 2001 From: unashi Date: Tue, 20 Feb 2024 20:54:32 +0800 Subject: [PATCH 039/985] [fix] rm whitespaces --- src/Storages/MergeTree/MergeTreeData.cpp | 4 ---- 1 file changed, 4 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index be1346e0ea2..18bb0966bfc 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -7171,9 +7171,7 @@ std::pair MergeTreeData::cloneAn } } if (!copy_successful) - { LOG_FATAL(&Poco::Logger::get("MergeTreeData"), "Hard link fail, clone fail"); - } } @@ -7304,9 +7302,7 @@ std::pair MergeTreeData::cloneAn } } if (!copy_successful) - { LOG_FATAL( &Poco::Logger::get("MergeTreeData"), "Hard link fail, clone fail."); - } if (params.metadata_version_to_write.has_value()) { chassert(!params.keep_metadata_version); From f829a97d9130de5609e07e237b9486847422bc8c Mon Sep 17 00:00:00 2001 From: unashi Date: Tue, 20 Feb 2024 21:08:24 +0800 Subject: [PATCH 040/985] [fix] rm whitespaces --- src/Storages/MergeTree/MergeTreeData.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index 18bb0966bfc..849ceb1b66d 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp 
+++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -7302,7 +7302,7 @@ std::pair MergeTreeData::cloneAn } } if (!copy_successful) - LOG_FATAL( &Poco::Logger::get("MergeTreeData"), "Hard link fail, clone fail."); + LOG_FATAL(&Poco::Logger::get("MergeTreeData"), "Hard link fail, clone fail."); if (params.metadata_version_to_write.has_value()) { chassert(!params.keep_metadata_version); From 28282eee91add78e5b18202bd38566d1d3797083 Mon Sep 17 00:00:00 2001 From: unashi Date: Tue, 20 Feb 2024 21:37:09 +0800 Subject: [PATCH 041/985] [fix] Add description in partition.md --- docs/en/sql-reference/statements/alter/partition.md | 2 ++ 1 file changed, 2 insertions(+) diff --git a/docs/en/sql-reference/statements/alter/partition.md b/docs/en/sql-reference/statements/alter/partition.md index 114b8d5ffe3..277e174bb05 100644 --- a/docs/en/sql-reference/statements/alter/partition.md +++ b/docs/en/sql-reference/statements/alter/partition.md @@ -116,6 +116,8 @@ For the query to run successfully, the following conditions must be met: - Both tables must have the same indices and projections. - Both tables must have the same storage policy. +If both tables have the same storage policy, use hardlink to attach partition. Otherwise, use copying the data to attach partition. + ## REPLACE PARTITION ``` sql From 1731a5a8afba5a48ce01cea20e0cdc1f91316841 Mon Sep 17 00:00:00 2001 From: unashi Date: Wed, 21 Feb 2024 10:55:32 +0800 Subject: [PATCH 042/985] [improve]change the integration test test_multiple_disks::test_move_across_policies_not_work to test_move_across_policies_work_for_attach_not_work_for_move --- tests/integration/test_multiple_disks/test.py | 36 +++++++------------ 1 file changed, 13 insertions(+), 23 deletions(-) diff --git a/tests/integration/test_multiple_disks/test.py b/tests/integration/test_multiple_disks/test.py index fdd81284b2a..9584ace7f45 100644 --- a/tests/integration/test_multiple_disks/test.py +++ b/tests/integration/test_multiple_disks/test.py @@ -5,6 +5,7 @@ import string import threading import time from multiprocessing.dummy import Pool +from helpers.test_tools import assert_eq_with_retry import pytest from helpers.client import QueryRuntimeException @@ -1745,9 +1746,9 @@ def test_move_while_merge(start_cluster): node1.query(f"DROP TABLE IF EXISTS {name} SYNC") -def test_move_across_policies_does_not_work(start_cluster): +def test_move_across_policies_work_for_attach_not_work_for_move(start_cluster): try: - name = "test_move_across_policies_does_not_work" + name = "test_move_across_policies_work_for_attach_not_work_for_move" node1.query( """ @@ -1783,25 +1784,18 @@ def test_move_across_policies_does_not_work(start_cluster): except QueryRuntimeException: """All parts of partition 'all' are already on disk 'jbod2'.""" - with pytest.raises( - QueryRuntimeException, - match=".*because disk does not belong to storage policy.*", - ): - node1.query( - """ALTER TABLE {name}2 ATTACH PARTITION tuple() FROM {name}""".format( - name=name - ) + node1.query( + """ALTER TABLE {name}2 ATTACH PARTITION tuple() FROM {name}""".format( + name=name ) - - with pytest.raises( - QueryRuntimeException, - match=".*because disk does not belong to storage policy.*", - ): + ) + assert_eq_with_retry( + node1, + """SELECT * FROM {name}2""".format(name=name), node1.query( - """ALTER TABLE {name}2 REPLACE PARTITION tuple() FROM {name}""".format( - name=name - ) - ) + """SELECT * FROM {name}""".format(name=name), + ), + ) with pytest.raises( QueryRuntimeException, @@ -1813,10 +1807,6 @@ def 
test_move_across_policies_does_not_work(start_cluster): ) ) - assert node1.query( - """SELECT * FROM {name}""".format(name=name) - ).splitlines() == ["1"] - finally: node1.query(f"DROP TABLE IF EXISTS {name} SYNC") node1.query(f"DROP TABLE IF EXISTS {name}2 SYNC") From e98d09c93e6c54a2cc4eadab8614539c0a5eb0f8 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Wed, 21 Feb 2024 21:41:04 +0100 Subject: [PATCH 043/985] Do not load useless columns from the index in memory --- contrib/rapidjson | 2 +- src/Processors/QueryPlan/PartsSplitter.cpp | 9 ++++--- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 21 +++++++++++++++ .../MergeTree/MergeTreeDataSelectExecutor.cpp | 26 +++++++++++++++---- src/Storages/MergeTree/MergeTreeSettings.h | 2 +- 5 files changed, 49 insertions(+), 11 deletions(-) diff --git a/contrib/rapidjson b/contrib/rapidjson index c4ef90ccdbc..a9bc56c9165 160000 --- a/contrib/rapidjson +++ b/contrib/rapidjson @@ -1 +1 @@ -Subproject commit c4ef90ccdbc21d5d5a628d08316bfd301e32d6fa +Subproject commit a9bc56c9165f1dbbbcada64221bd3a59042c5b95 diff --git a/src/Processors/QueryPlan/PartsSplitter.cpp b/src/Processors/QueryPlan/PartsSplitter.cpp index 0fc6ddd6408..fcb1d8dd92c 100644 --- a/src/Processors/QueryPlan/PartsSplitter.cpp +++ b/src/Processors/QueryPlan/PartsSplitter.cpp @@ -32,9 +32,9 @@ std::string toString(const Values & value) int compareValues(const Values & lhs, const Values & rhs) { - chassert(lhs.size() == rhs.size()); + size_t size = std::min(lhs.size(), rhs.size()); - for (size_t i = 0; i < lhs.size(); ++i) + for (size_t i = 0; i < size; ++i) { if (applyVisitor(FieldVisitorAccurateLess(), lhs[i], rhs[i])) return -1; @@ -55,8 +55,9 @@ public: Values getValue(size_t part_idx, size_t mark) const { const auto & index = parts[part_idx].data_part->getIndex(); - Values values(index.size()); - for (size_t i = 0; i < values.size(); ++i) + size_t size = index.size(); + Values values(size); + for (size_t i = 0; i < size; ++i) { index[i]->get(mark, values[i]); if (values[i].isNull()) diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index 11ede661f78..629f3688874 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -869,6 +869,27 @@ void IMergeTreeDataPart::loadIndex() const for (size_t j = 0; j < key_size; ++j) key_serializations[j]->deserializeBinary(*loaded_index[j], *index_file, {}); + /// Cut useless suffix columns, if necessary. 
+ Float64 ratio_to_drop_suffix_columns = storage.getSettings()->primary_key_ratio_of_unique_prefix_values_to_skip_suffix_columns; + if (key_size > 1 && ratio_to_drop_suffix_columns > 0 && ratio_to_drop_suffix_columns < 1) + { + chassert(marks_count > 0); + for (size_t j = 0; j < key_size - 1; ++j) + { + size_t num_changes = 0; + for (size_t i = 1; i < marks_count; ++i) + if (0 != loaded_index[j]->compareAt(i, i - 1, *loaded_index[j], 0)) + ++num_changes; + + if (static_cast(num_changes) / marks_count >= ratio_to_drop_suffix_columns) + { + key_size = j + 1; + loaded_index.resize(key_size); + break; + } + } + } + for (size_t i = 0; i < key_size; ++i) { loaded_index[i]->shrinkToFit(); diff --git a/src/Storages/MergeTree/MergeTreeDataSelectExecutor.cpp b/src/Storages/MergeTree/MergeTreeDataSelectExecutor.cpp index 1ba28713680..175419f20e0 100644 --- a/src/Storages/MergeTree/MergeTreeDataSelectExecutor.cpp +++ b/src/Storages/MergeTree/MergeTreeDataSelectExecutor.cpp @@ -1110,7 +1110,11 @@ MarkRanges MergeTreeDataSelectExecutor::markRangesFromPKRange( DataTypes key_types; for (size_t i : key_indices) { - index_columns->emplace_back(ColumnWithTypeAndName{index[i], primary_key.data_types[i], primary_key.column_names[i]}); + if (i < index.size()) + index_columns->emplace_back(index[i], primary_key.data_types[i], primary_key.column_names[i]); + else + index_columns->emplace_back(); /// The column of the primary key was not loaded in memory - we'll skip it. + key_types.emplace_back(primary_key.data_types[i]); } @@ -1119,7 +1123,6 @@ MarkRanges MergeTreeDataSelectExecutor::markRangesFromPKRange( std::function create_field_ref; if (key_condition.hasMonotonicFunctionsChain()) { - create_field_ref = [index_columns](size_t row, size_t column, FieldRef & field) { field = {index_columns.get(), row, column}; @@ -1159,7 +1162,11 @@ MarkRanges MergeTreeDataSelectExecutor::markRangesFromPKRange( { for (size_t i = 0; i < used_key_size; ++i) { - create_field_ref(range.begin, i, index_left[i]); + if ((*index_columns)[i].column) + create_field_ref(range.begin, i, index_left[i]); + else + index_left[i] = NEGATIVE_INFINITY; + index_right[i] = POSITIVE_INFINITY; } } @@ -1170,8 +1177,17 @@ MarkRanges MergeTreeDataSelectExecutor::markRangesFromPKRange( for (size_t i = 0; i < used_key_size; ++i) { - create_field_ref(range.begin, i, index_left[i]); - create_field_ref(range.end, i, index_right[i]); + if ((*index_columns)[i].column) + { + create_field_ref(range.begin, i, index_left[i]); + create_field_ref(range.end, i, index_right[i]); + } + else + { + /// If the PK column was not loaded in memory - exclude it from the analysis. + index_left[i] = NEGATIVE_INFINITY; + index_right[i] = POSITIVE_INFINITY; + } } } key_condition_maybe_true = key_condition.mayBeTrueInRange(used_key_size, index_left.data(), index_right.data(), key_types); diff --git a/src/Storages/MergeTree/MergeTreeSettings.h b/src/Storages/MergeTree/MergeTreeSettings.h index b64632b6139..1cff44142bc 100644 --- a/src/Storages/MergeTree/MergeTreeSettings.h +++ b/src/Storages/MergeTree/MergeTreeSettings.h @@ -202,7 +202,7 @@ struct Settings; M(UInt64, marks_compress_block_size, 65536, "Mark compress block size, the actual size of the block to compress.", 0) \ M(UInt64, primary_key_compress_block_size, 65536, "Primary compress block size, the actual size of the block to compress.", 0) \ M(Bool, primary_key_lazy_load, true, "Load primary key in memory on first use instead of on table initialization. 
This can save memory in the presence of a large number of tables.", 0) \ - \ + M(Float, primary_key_ratio_of_unique_prefix_values_to_skip_suffix_columns, 0.9f, "If the value of a column of the primary key in data part changes at least in this ratio of times, skip loading next columns in memory. This allows to save memory usage by not loading useless columns of the primary key.", 0) \ /** Projection settings. */ \ M(UInt64, max_projections, 25, "The maximum number of merge tree projections.", 0) \ From 31de27b149ab2922647ff7d9141871330cc9d743 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Wed, 21 Feb 2024 21:42:19 +0100 Subject: [PATCH 044/985] Do not load useless columns from the index in memory --- contrib/rapidjson | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/contrib/rapidjson b/contrib/rapidjson index a9bc56c9165..c4ef90ccdbc 160000 --- a/contrib/rapidjson +++ b/contrib/rapidjson @@ -1 +1 @@ -Subproject commit a9bc56c9165f1dbbbcada64221bd3a59042c5b95 +Subproject commit c4ef90ccdbc21d5d5a628d08316bfd301e32d6fa From d0d84a840151675ee3c7a108709e4b0b486af577 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Wed, 21 Feb 2024 23:03:01 +0100 Subject: [PATCH 045/985] Add a test --- .../02998_primary_key_skip_columns.reference | 18 ++++++++++ .../02998_primary_key_skip_columns.sql | 33 +++++++++++++++++++ 2 files changed, 51 insertions(+) create mode 100644 tests/queries/0_stateless/02998_primary_key_skip_columns.reference create mode 100644 tests/queries/0_stateless/02998_primary_key_skip_columns.sql diff --git a/tests/queries/0_stateless/02998_primary_key_skip_columns.reference b/tests/queries/0_stateless/02998_primary_key_skip_columns.reference new file mode 100644 index 00000000000..9df0a2c097c --- /dev/null +++ b/tests/queries/0_stateless/02998_primary_key_skip_columns.reference @@ -0,0 +1,18 @@ +100000 +14954 +798 +15908 +108 +120 +2334 +19 +Key size: 2400000 +100000 +14954 +798 +15907 +108 +120 +2334 +19 +Key size: 800008 diff --git a/tests/queries/0_stateless/02998_primary_key_skip_columns.sql b/tests/queries/0_stateless/02998_primary_key_skip_columns.sql new file mode 100644 index 00000000000..801fa35fb52 --- /dev/null +++ b/tests/queries/0_stateless/02998_primary_key_skip_columns.sql @@ -0,0 +1,33 @@ +DROP TABLE IF EXISTS test; + +CREATE TABLE test (a UInt64, b UInt64, c UInt64) ENGINE = MergeTree ORDER BY (a, b, c) SETTINGS index_granularity = 1, primary_key_ratio_of_unique_prefix_values_to_skip_suffix_columns = 1; +INSERT INTO test SELECT sipHash64(number, 1), sipHash64(number, 2), sipHash64(number, 3) FROM numbers(100000); + +SELECT count() FROM test; +SELECT count() FROM test WHERE a > 1849813033528774208 AND a < 4594276315503201760; +SELECT count() FROM test WHERE b > 7898976344263989848 AND b < 8040320939819153137; +SELECT count() FROM test WHERE c > 13239894303140990071 AND c < 16179795840886947236; +SELECT count() FROM test WHERE a > 1849813033528774208 AND a < 4594276315503201760 AND b > 7898976344263989848 AND b < 8040320939819153137; +SELECT count() FROM test WHERE b > 7898976344263989848 AND b < 8040320939819153137 AND c > 13239894303140990071 AND c < 16179795840886947236; +SELECT count() FROM test WHERE a > 1849813033528774208 AND a < 4594276315503201760 AND c > 13239894303140990071 AND c < 16179795840886947236; +SELECT count() FROM test WHERE a > 1849813033528774208 AND a < 4594276315503201760 AND b > 7898976344263989848 AND b < 8040320939819153137 AND c > 13239894303140990071 AND c < 16179795840886947236; + +SELECT 'Key size: ', 
round(sum(primary_key_bytes_in_memory), -5) FROM system.parts WHERE database = currentDatabase() AND table = 'test'; + +ALTER TABLE test MODIFY SETTING primary_key_ratio_of_unique_prefix_values_to_skip_suffix_columns = 0.9; + +DETACH TABLE test; +ATTACH TABLE test; + +SELECT count() FROM test; +SELECT count() FROM test WHERE a > 1849813033528774208 AND a < 4594276315503201760; +SELECT count() FROM test WHERE b > 7898976344263989848 AND b < 8040320939819153137; +SELECT count() FROM test WHERE c > 13239894303140990071 AND c < 16179795840886947236; +SELECT count() FROM test WHERE a > 1849813033528774208 AND a < 4594276315503201760 AND b > 7898976344263989848 AND b < 8040320939819153137; +SELECT count() FROM test WHERE b > 7898976344263989848 AND b < 8040320939819153137 AND c > 13239894303140990071 AND c < 16179795840886947236; +SELECT count() FROM test WHERE a > 1849813033528774208 AND a < 4594276315503201760 AND c > 13239894303140990071 AND c < 16179795840886947236; +SELECT count() FROM test WHERE a > 1849813033528774208 AND a < 4594276315503201760 AND b > 7898976344263989848 AND b < 8040320939819153137 AND c > 13239894303140990071 AND c < 16179795840886947236; + +SELECT 'Key size: ', round(sum(primary_key_bytes_in_memory), 5) FROM system.parts WHERE database = currentDatabase() AND table = 'test'; + +DROP TABLE test; From 395ad35c93a185291a16449b1ac4d1dcecb1a127 Mon Sep 17 00:00:00 2001 From: Shanfeng Pang Date: Thu, 22 Feb 2024 10:41:16 +0800 Subject: [PATCH 046/985] fix LRUResource Cache bug --- src/Common/LRUResourceCache.h | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Common/LRUResourceCache.h b/src/Common/LRUResourceCache.h index 4ccaa272346..60b4053bff5 100644 --- a/src/Common/LRUResourceCache.h +++ b/src/Common/LRUResourceCache.h @@ -221,7 +221,7 @@ private: { std::lock_guard lock(mutex); auto it = cells.find(key); - if (it != cells.end() && !it->second.expired) + if (it != cells.end()) { if (!it->second.expired) { From 999cf88ab79cf71bc82e7be3140496697a661416 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Thu, 22 Feb 2024 09:54:39 +0100 Subject: [PATCH 047/985] Improve test --- tests/queries/0_stateless/02998_primary_key_skip_columns.sql | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02998_primary_key_skip_columns.sql b/tests/queries/0_stateless/02998_primary_key_skip_columns.sql index 801fa35fb52..b2dadcc5e7c 100644 --- a/tests/queries/0_stateless/02998_primary_key_skip_columns.sql +++ b/tests/queries/0_stateless/02998_primary_key_skip_columns.sql @@ -28,6 +28,6 @@ SELECT count() FROM test WHERE b > 7898976344263989848 AND b < 80403209398191531 SELECT count() FROM test WHERE a > 1849813033528774208 AND a < 4594276315503201760 AND c > 13239894303140990071 AND c < 16179795840886947236; SELECT count() FROM test WHERE a > 1849813033528774208 AND a < 4594276315503201760 AND b > 7898976344263989848 AND b < 8040320939819153137 AND c > 13239894303140990071 AND c < 16179795840886947236; -SELECT 'Key size: ', round(sum(primary_key_bytes_in_memory), 5) FROM system.parts WHERE database = currentDatabase() AND table = 'test'; +SELECT 'Key size: ', round(sum(primary_key_bytes_in_memory), -5) FROM system.parts WHERE database = currentDatabase() AND table = 'test'; DROP TABLE test; From 9b10aebecc690e36ec3591ba7115991b00920289 Mon Sep 17 00:00:00 2001 From: Shanfeng Pang Date: Thu, 22 Feb 2024 17:24:59 +0800 Subject: [PATCH 048/985] add unit-test for bug fix --- src/Common/tests/gtest_lru_resource_cache.cpp | 27 
+++++++++++++++++++ 1 file changed, 27 insertions(+) diff --git a/src/Common/tests/gtest_lru_resource_cache.cpp b/src/Common/tests/gtest_lru_resource_cache.cpp index bc037824ff8..94490d1e86d 100644 --- a/src/Common/tests/gtest_lru_resource_cache.cpp +++ b/src/Common/tests/gtest_lru_resource_cache.cpp @@ -45,6 +45,33 @@ struct MyWeight size_t operator()(const int & x) const { return static_cast(x); } }; +TEST(LRUResourceCache, remove2) +{ + using MyCache = DB::LRUResourceCache; + auto mcache = MyCache(10, 10); + for (int i = 1; i < 5; ++i) + { + auto load_int = [&] { return std::make_shared(i); }; + mcache.getOrSet(i, load_int); + } + + auto n = mcache.size(); + ASSERT_EQ(n, 4); + auto w = mcache.weight(); + ASSERT_EQ(w, 10); + auto holder4 = mcache.get(4); + ASSERT_TRUE(holder4 != nullptr); + mcache.tryRemove(4); + auto holder_reget_4 = mcache.get(4); + ASSERT_TRUE(holder_reget_4 == nullptr); + mcache.getOrSet(4, [&]() { return std::make_shared(4); }); + holder4.reset(); + auto holder1 = mcache.getOrSet(1, [&]() { return std::make_shared(1); }); + ASSERT_TRUE(holder1 != nullptr); + auto holder7 = mcache.getOrSet(7, [&] { return std::make_shared(7); }); + ASSERT_TRUE(holder7 != nullptr); +} + TEST(LRUResourceCache, evictOnWweight) { using MyCache = DB::LRUResourceCache; From 3ef159853c78e438e6088d60a64bcff2bbb77b17 Mon Sep 17 00:00:00 2001 From: Michael Kolupaev Date: Thu, 22 Feb 2024 14:34:18 +0000 Subject: [PATCH 049/985] Do something to the test --- .../0_stateless/02998_primary_key_skip_columns.reference | 2 +- tests/queries/0_stateless/02998_primary_key_skip_columns.sql | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/tests/queries/0_stateless/02998_primary_key_skip_columns.reference b/tests/queries/0_stateless/02998_primary_key_skip_columns.reference index 9df0a2c097c..ec44acbd16b 100644 --- a/tests/queries/0_stateless/02998_primary_key_skip_columns.reference +++ b/tests/queries/0_stateless/02998_primary_key_skip_columns.reference @@ -15,4 +15,4 @@ Key size: 2400000 120 2334 19 -Key size: 800008 +Key size ok: 1 1 diff --git a/tests/queries/0_stateless/02998_primary_key_skip_columns.sql b/tests/queries/0_stateless/02998_primary_key_skip_columns.sql index b2dadcc5e7c..27672d7854e 100644 --- a/tests/queries/0_stateless/02998_primary_key_skip_columns.sql +++ b/tests/queries/0_stateless/02998_primary_key_skip_columns.sql @@ -28,6 +28,6 @@ SELECT count() FROM test WHERE b > 7898976344263989848 AND b < 80403209398191531 SELECT count() FROM test WHERE a > 1849813033528774208 AND a < 4594276315503201760 AND c > 13239894303140990071 AND c < 16179795840886947236; SELECT count() FROM test WHERE a > 1849813033528774208 AND a < 4594276315503201760 AND b > 7898976344263989848 AND b < 8040320939819153137 AND c > 13239894303140990071 AND c < 16179795840886947236; -SELECT 'Key size: ', round(sum(primary_key_bytes_in_memory), -5) FROM system.parts WHERE database = currentDatabase() AND table = 'test'; +SELECT 'Key size ok: ', (sum(primary_key_bytes_in_memory) as s) >= 800000, s < 1200000 FROM system.parts WHERE database = currentDatabase() AND table = 'test'; DROP TABLE test; From f1e95fb78bae190bb87e93704cf5f88c70cdccf4 Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 22 Feb 2024 15:38:44 +0100 Subject: [PATCH 050/985] Add a way to force read-through cache for merges --- src/Core/Settings.h | 1 + src/Disks/IO/ReadBufferFromRemoteFSGather.cpp | 10 +- .../Cached/CachedObjectStorage.cpp | 14 -- .../Cached/CachedObjectStorage.h | 2 - src/IO/ReadSettings.h | 2 +- 
src/Interpreters/Cache/FileSegment.cpp | 3 +- src/Interpreters/Context.cpp | 1 + .../MergeTree/MergeTreeSequentialSource.cpp | 2 +- .../integration/test_filesystem_cache/test.py | 79 ++++++++ .../users.d/cache_on_write_operations.xml | 7 + .../force_read_through_cache_on_merge.xml | 7 + ...system_cache_on_write_operations.reference | 170 ++++++++++++++++++ ...41_filesystem_cache_on_write_operations.sh | 81 +++++---- 13 files changed, 317 insertions(+), 62 deletions(-) create mode 100644 tests/integration/test_filesystem_cache/users.d/cache_on_write_operations.xml create mode 100644 tests/integration/test_filesystem_cache/users.d/force_read_through_cache_on_merge.xml diff --git a/src/Core/Settings.h b/src/Core/Settings.h index 433195af9c3..db060bf712d 100644 --- a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -769,6 +769,7 @@ class IColumn; M(Bool, enable_filesystem_cache_on_write_operations, false, "Write into cache on write operations. To actually work this setting requires be added to disk config too", 0) \ M(Bool, enable_filesystem_cache_log, false, "Allows to record the filesystem caching log for each query", 0) \ M(Bool, read_from_filesystem_cache_if_exists_otherwise_bypass_cache, false, "Allow to use the filesystem cache in passive mode - benefit from the existing cache entries, but don't put more entries into the cache. If you set this setting for heavy ad-hoc queries and leave it disabled for short real-time queries, this will allows to avoid cache threshing by too heavy queries and to improve the overall system efficiency.", 0) \ + M(Bool, force_read_through_cache_for_merges, false, "Force read-through cache for merges", 0) \ M(Bool, skip_download_if_exceeds_query_cache, true, "Skip download from remote filesystem if exceeds query cache size", 0) \ M(UInt64, filesystem_cache_max_download_size, (128UL * 1024 * 1024 * 1024), "Max remote filesystem cache size that can be downloaded by a single query", 0) \ M(Bool, throw_on_error_from_cache_on_write_operations, false, "Ignore error from cache when caching on write operations (INSERT, merges)", 0) \ diff --git a/src/Disks/IO/ReadBufferFromRemoteFSGather.cpp b/src/Disks/IO/ReadBufferFromRemoteFSGather.cpp index 0b3ecca3587..1da39c7011c 100644 --- a/src/Disks/IO/ReadBufferFromRemoteFSGather.cpp +++ b/src/Disks/IO/ReadBufferFromRemoteFSGather.cpp @@ -16,12 +16,10 @@ using namespace DB; namespace { -bool withCache(const ReadSettings & settings) -{ - return settings.remote_fs_cache && settings.enable_filesystem_cache - && (!CurrentThread::getQueryId().empty() || settings.read_from_filesystem_cache_if_exists_otherwise_bypass_cache - || !settings.avoid_readthrough_cache_outside_query_context); -} + bool withCache(const ReadSettings & settings) + { + return settings.remote_fs_cache && settings.enable_filesystem_cache; + } } namespace DB diff --git a/src/Disks/ObjectStorages/Cached/CachedObjectStorage.cpp b/src/Disks/ObjectStorages/Cached/CachedObjectStorage.cpp index 1444f4c9c76..e3ab772e3b5 100644 --- a/src/Disks/ObjectStorages/Cached/CachedObjectStorage.cpp +++ b/src/Disks/ObjectStorages/Cached/CachedObjectStorage.cpp @@ -43,10 +43,6 @@ ReadSettings CachedObjectStorage::patchSettings(const ReadSettings & read_settin { ReadSettings modified_settings{read_settings}; modified_settings.remote_fs_cache = cache; - - if (!canUseReadThroughCache(read_settings)) - modified_settings.read_from_filesystem_cache_if_exists_otherwise_bypass_cache = true; - return object_storage->patchSettings(modified_settings); } @@ -206,14 +202,4 @@ String 
CachedObjectStorage::getObjectsNamespace() const return object_storage->getObjectsNamespace(); } -bool CachedObjectStorage::canUseReadThroughCache(const ReadSettings & settings) -{ - if (!settings.avoid_readthrough_cache_outside_query_context) - return true; - - return CurrentThread::isInitialized() - && CurrentThread::get().getQueryContext() - && !CurrentThread::getQueryId().empty(); -} - } diff --git a/src/Disks/ObjectStorages/Cached/CachedObjectStorage.h b/src/Disks/ObjectStorages/Cached/CachedObjectStorage.h index 437baead7be..961c2709efc 100644 --- a/src/Disks/ObjectStorages/Cached/CachedObjectStorage.h +++ b/src/Disks/ObjectStorages/Cached/CachedObjectStorage.h @@ -119,8 +119,6 @@ public: const FileCacheSettings & getCacheSettings() const { return cache_settings; } - static bool canUseReadThroughCache(const ReadSettings & settings); - #if USE_AZURE_BLOB_STORAGE std::shared_ptr getAzureBlobStorageClient() override { diff --git a/src/IO/ReadSettings.h b/src/IO/ReadSettings.h index c397689d6ad..2c79735317d 100644 --- a/src/IO/ReadSettings.h +++ b/src/IO/ReadSettings.h @@ -99,7 +99,7 @@ struct ReadSettings bool read_from_filesystem_cache_if_exists_otherwise_bypass_cache = false; bool enable_filesystem_cache_log = false; /// Don't populate cache when the read is not part of query execution (e.g. background thread). - bool avoid_readthrough_cache_outside_query_context = true; + bool force_read_through_cache_merges = false; size_t filesystem_cache_segments_batch_size = 20; size_t filesystem_cache_max_download_size = (128UL * 1024 * 1024 * 1024); diff --git a/src/Interpreters/Cache/FileSegment.cpp b/src/Interpreters/Cache/FileSegment.cpp index 8bd89465917..7c0505889da 100644 --- a/src/Interpreters/Cache/FileSegment.cpp +++ b/src/Interpreters/Cache/FileSegment.cpp @@ -10,6 +10,7 @@ #include #include #include +#include #include @@ -194,7 +195,7 @@ bool FileSegment::isDownloaded() const String FileSegment::getCallerId() { if (!CurrentThread::isInitialized() || CurrentThread::getQueryId().empty()) - return "None:" + toString(getThreadId()); + return fmt::format("None:{}:{}", getThreadName(), toString(getThreadId())); return std::string(CurrentThread::getQueryId()) + ":" + toString(getThreadId()); } diff --git a/src/Interpreters/Context.cpp b/src/Interpreters/Context.cpp index 55a4df10206..36b362e36bb 100644 --- a/src/Interpreters/Context.cpp +++ b/src/Interpreters/Context.cpp @@ -5079,6 +5079,7 @@ ReadSettings Context::getReadSettings() const res.read_from_filesystem_cache_if_exists_otherwise_bypass_cache = settings.read_from_filesystem_cache_if_exists_otherwise_bypass_cache; res.enable_filesystem_cache_log = settings.enable_filesystem_cache_log; res.filesystem_cache_segments_batch_size = settings.filesystem_cache_segments_batch_size; + res.force_read_through_cache_merges = settings.force_read_through_cache_for_merges; res.filesystem_cache_max_download_size = settings.filesystem_cache_max_download_size; res.skip_download_if_exceeds_query_cache = settings.skip_download_if_exceeds_query_cache; diff --git a/src/Storages/MergeTree/MergeTreeSequentialSource.cpp b/src/Storages/MergeTree/MergeTreeSequentialSource.cpp index d0fbc316024..e375e8b0a9f 100644 --- a/src/Storages/MergeTree/MergeTreeSequentialSource.cpp +++ b/src/Storages/MergeTree/MergeTreeSequentialSource.cpp @@ -151,7 +151,7 @@ MergeTreeSequentialSource::MergeTreeSequentialSource( const auto & context = storage.getContext(); ReadSettings read_settings = context->getReadSettings(); - 
read_settings.read_from_filesystem_cache_if_exists_otherwise_bypass_cache = true; + read_settings.read_from_filesystem_cache_if_exists_otherwise_bypass_cache = !read_settings.force_read_through_cache_merges; /// It does not make sense to use pthread_threadpool for background merges/mutations /// And also to preserve backward compatibility read_settings.local_fs_method = LocalFSReadMethod::pread; diff --git a/tests/integration/test_filesystem_cache/test.py b/tests/integration/test_filesystem_cache/test.py index eb5f896f7a9..c1ba6702dcf 100644 --- a/tests/integration/test_filesystem_cache/test.py +++ b/tests/integration/test_filesystem_cache/test.py @@ -19,6 +19,9 @@ def cluster(): main_configs=[ "config.d/storage_conf.xml", ], + user_configs=[ + "users.d/cache_on_write_operations.xml", + ], stay_alive=True, ) cluster.add_instance( @@ -35,6 +38,17 @@ def cluster(): ], stay_alive=True, ) + cluster.add_instance( + "node_force_read_through_cache_on_merge", + main_configs=[ + "config.d/storage_conf.xml", + ], + user_configs=[ + "users.d/force_read_through_cache_on_merge.xml", + "users.d/cache_on_write_operations.xml", + ], + stay_alive=True, + ) logging.info("Starting cluster...") cluster.start() @@ -323,3 +337,68 @@ def test_custom_cached_disk(cluster): "SELECT cache_path FROM system.disks WHERE name = 'custom_cached4'" ).strip() ) + + +def test_force_filesystem_cache_on_merges(cluster): + def test(node, forced_read_through_cache_on_merge): + node.query( + """ + DROP TABLE IF EXISTS test SYNC; + + CREATE TABLE test (key UInt32, value String) + Engine=MergeTree() + ORDER BY value + SETTINGS disk = disk( + type = cache, + path = 'force_cache_on_merges', + disk = 'hdd_blob', + max_file_segment_size = '1Ki', + cache_on_write_operations = 1, + boundary_alignment = '1Ki', + max_size = '10Gi', + max_elements = 10000000, + load_metadata_threads = 30); + + SYSTEM DROP FILESYSTEM CACHE; + INSERT INTO test SELECT * FROM generateRandom('a Int32, b String') LIMIT 1000000; + INSERT INTO test SELECT * FROM generateRandom('a Int32, b String') LIMIT 1000000; + """ + ) + assert int(node.query("SELECT count() FROM system.filesystem_cache")) > 0 + assert int(node.query("SELECT max(size) FROM system.filesystem_cache")) == 1024 + + write_count = int( + node.query( + "SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes'" + ) + ) + assert write_count > 100000 + assert "" == node.query( + "SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes'" + ) + + node.query("SYSTEM DROP FILESYSTEM CACHE") + node.query("OPTIMIZE TABLE test FINAL") + + new_write_count = int( + node.query( + "SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes'" + ) + ) + assert new_write_count >= write_count + + if forced_read_through_cache_on_merge: + assert 100000 < int( + node.query( + "SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes'" + ) + ) + else: + assert "" == node.query( + "SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes'" + ) + + node = cluster.instances["node_force_read_through_cache_on_merge"] + test(node, True) + node = cluster.instances["node"] + test(node, False) diff --git a/tests/integration/test_filesystem_cache/users.d/cache_on_write_operations.xml b/tests/integration/test_filesystem_cache/users.d/cache_on_write_operations.xml new file mode 100644 index 00000000000..5de169edc1e --- /dev/null +++ b/tests/integration/test_filesystem_cache/users.d/cache_on_write_operations.xml @@ -0,0 +1,7 @@ + + 
+ + 1 + + + diff --git a/tests/integration/test_filesystem_cache/users.d/force_read_through_cache_on_merge.xml b/tests/integration/test_filesystem_cache/users.d/force_read_through_cache_on_merge.xml new file mode 100644 index 00000000000..4d26a1a8bc7 --- /dev/null +++ b/tests/integration/test_filesystem_cache/users.d/force_read_through_cache_on_merge.xml @@ -0,0 +1,7 @@ + + + + 1 + + + diff --git a/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.reference b/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.reference index 157837983f7..c03b928684b 100644 --- a/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.reference +++ b/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.reference @@ -1,62 +1,232 @@ Using storage policy: s3_cache +DROP TABLE IF EXISTS test_02241 +CREATE TABLE test_02241 (key UInt32, value String) Engine=MergeTree() ORDER BY key SETTINGS storage_policy='s3_cache', min_bytes_for_wide_part = 10485760, compress_marks=false, compress_primary_key=false, ratio_of_defaults_for_sparse_serialization = 1 +SYSTEM STOP MERGES test_02241 +SYSTEM DROP FILESYSTEM CACHE +SELECT file_segment_range_begin, file_segment_range_end, size, state + FROM + ( + SELECT file_segment_range_begin, file_segment_range_end, size, state, local_path + FROM + ( + SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path + FROM system.remote_data_paths + ) AS data_paths + INNER JOIN + system.filesystem_cache AS caches + ON data_paths.cache_path = caches.cache_path + ) + WHERE endsWith(local_path, 'data.bin') + FORMAT Vertical +SELECT count() FROM (SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path FROM system.remote_data_paths ) AS data_paths INNER JOIN system.filesystem_cache AS caches ON data_paths.cache_path = caches.cache_path 0 +SELECT count(), sum(size) FROM system.filesystem_cache 0 0 +INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100) +SELECT file_segment_range_begin, file_segment_range_end, size, state + FROM + ( + SELECT file_segment_range_begin, file_segment_range_end, size, state, local_path + FROM + ( + SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path + FROM system.remote_data_paths + ) AS data_paths + INNER JOIN + system.filesystem_cache AS caches + ON data_paths.cache_path = caches.cache_path + ) + WHERE endsWith(local_path, 'data.bin') + FORMAT Vertical Row 1: ────── file_segment_range_begin: 0 file_segment_range_end: 745 size: 746 state: DOWNLOADED +SELECT count() FROM (SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path FROM system.remote_data_paths ) AS data_paths INNER JOIN system.filesystem_cache AS caches ON data_paths.cache_path = caches.cache_path 8 +SELECT count(), sum(size) FROM system.filesystem_cache 8 1100 +SELECT count() FROM system.filesystem_cache WHERE cache_hits > 0 0 +SELECT * FROM test_02241 FORMAT Null +SELECT count() FROM system.filesystem_cache WHERE cache_hits > 0 2 +SELECT * FROM test_02241 FORMAT Null +SELECT count() FROM system.filesystem_cache WHERE cache_hits > 0 2 +SELECT count(), sum(size) size FROM system.filesystem_cache 8 1100 +SYSTEM DROP FILESYSTEM CACHE +INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100, 200) +SELECT file_segment_range_begin, file_segment_range_end, size, state + FROM + ( + SELECT file_segment_range_begin, file_segment_range_end, size, state, local_path + FROM + ( + SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path + FROM 
system.remote_data_paths + ) AS data_paths + INNER JOIN + system.filesystem_cache AS caches + ON data_paths.cache_path = caches.cache_path + ) + WHERE endsWith(local_path, 'data.bin') + FORMAT Vertical; Row 1: ────── file_segment_range_begin: 0 file_segment_range_end: 1659 size: 1660 state: DOWNLOADED +SELECT count() FROM (SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path FROM system.remote_data_paths ) AS data_paths INNER JOIN system.filesystem_cache AS caches ON data_paths.cache_path = caches.cache_path 8 +SELECT count(), sum(size) FROM system.filesystem_cache 8 2014 +SELECT count(), sum(size) FROM system.filesystem_cache 8 2014 +INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100) SETTINGS enable_filesystem_cache_on_write_operations=0 +SELECT count(), sum(size) FROM system.filesystem_cache 8 2014 +INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100) +INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(300, 10000) +SELECT count(), sum(size) FROM system.filesystem_cache 24 84045 +SYSTEM START MERGES test_02241 +SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes' +85146 +SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes' +OPTIMIZE TABLE test_02241 FINAL +SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes' +251542 +SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes' +SELECT count(), sum(size) FROM system.filesystem_cache 32 167243 +ALTER TABLE test_02241 UPDATE value = 'kek' WHERE key = 100 +SELECT count(), sum(size) FROM system.filesystem_cache 41 250541 +INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(5000000) +SYSTEM FLUSH LOGS INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(5000000) 0 +SELECT count() FROM test_02241 5010500 +SELECT count() FROM test_02241 WHERE value LIKE '%010%' 18816 Using storage policy: local_cache +DROP TABLE IF EXISTS test_02241 +CREATE TABLE test_02241 (key UInt32, value String) Engine=MergeTree() ORDER BY key SETTINGS storage_policy='local_cache', min_bytes_for_wide_part = 10485760, compress_marks=false, compress_primary_key=false, ratio_of_defaults_for_sparse_serialization = 1 +SYSTEM STOP MERGES test_02241 +SYSTEM DROP FILESYSTEM CACHE +SELECT file_segment_range_begin, file_segment_range_end, size, state + FROM + ( + SELECT file_segment_range_begin, file_segment_range_end, size, state, local_path + FROM + ( + SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path + FROM system.remote_data_paths + ) AS data_paths + INNER JOIN + system.filesystem_cache AS caches + ON data_paths.cache_path = caches.cache_path + ) + WHERE endsWith(local_path, 'data.bin') + FORMAT Vertical +SELECT count() FROM (SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path FROM system.remote_data_paths ) AS data_paths INNER JOIN system.filesystem_cache AS caches ON data_paths.cache_path = caches.cache_path 0 +SELECT count(), sum(size) FROM system.filesystem_cache 0 0 +INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100) +SELECT file_segment_range_begin, file_segment_range_end, size, state + FROM + ( + SELECT file_segment_range_begin, file_segment_range_end, size, state, local_path + FROM + ( + SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path + FROM system.remote_data_paths + ) AS data_paths + INNER JOIN + system.filesystem_cache AS caches + ON data_paths.cache_path = caches.cache_path + ) + WHERE 
endsWith(local_path, 'data.bin') + FORMAT Vertical Row 1: ────── file_segment_range_begin: 0 file_segment_range_end: 745 size: 746 state: DOWNLOADED +SELECT count() FROM (SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path FROM system.remote_data_paths ) AS data_paths INNER JOIN system.filesystem_cache AS caches ON data_paths.cache_path = caches.cache_path 8 +SELECT count(), sum(size) FROM system.filesystem_cache 8 1100 +SELECT count() FROM system.filesystem_cache WHERE cache_hits > 0 0 +SELECT * FROM test_02241 FORMAT Null +SELECT count() FROM system.filesystem_cache WHERE cache_hits > 0 2 +SELECT * FROM test_02241 FORMAT Null +SELECT count() FROM system.filesystem_cache WHERE cache_hits > 0 2 +SELECT count(), sum(size) size FROM system.filesystem_cache 8 1100 +SYSTEM DROP FILESYSTEM CACHE +INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100, 200) +SELECT file_segment_range_begin, file_segment_range_end, size, state + FROM + ( + SELECT file_segment_range_begin, file_segment_range_end, size, state, local_path + FROM + ( + SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path + FROM system.remote_data_paths + ) AS data_paths + INNER JOIN + system.filesystem_cache AS caches + ON data_paths.cache_path = caches.cache_path + ) + WHERE endsWith(local_path, 'data.bin') + FORMAT Vertical; Row 1: ────── file_segment_range_begin: 0 file_segment_range_end: 1659 size: 1660 state: DOWNLOADED +SELECT count() FROM (SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path FROM system.remote_data_paths ) AS data_paths INNER JOIN system.filesystem_cache AS caches ON data_paths.cache_path = caches.cache_path 8 +SELECT count(), sum(size) FROM system.filesystem_cache 8 2014 +SELECT count(), sum(size) FROM system.filesystem_cache 8 2014 +INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100) SETTINGS enable_filesystem_cache_on_write_operations=0 +SELECT count(), sum(size) FROM system.filesystem_cache 8 2014 +INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100) +INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(300, 10000) +SELECT count(), sum(size) FROM system.filesystem_cache 24 84045 +SYSTEM START MERGES test_02241 +SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes' +81715476 +SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes' +OPTIMIZE TABLE test_02241 FINAL +SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes' +81881872 +SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes' +SELECT count(), sum(size) FROM system.filesystem_cache 32 167243 +ALTER TABLE test_02241 UPDATE value = 'kek' WHERE key = 100 +SELECT count(), sum(size) FROM system.filesystem_cache 41 250541 +INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(5000000) +SYSTEM FLUSH LOGS INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(5000000) 0 +SELECT count() FROM test_02241 5010500 +SELECT count() FROM test_02241 WHERE value LIKE '%010%' 18816 diff --git a/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.sh b/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.sh index 96f61cf61e8..2b237492e98 100755 --- a/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.sh +++ b/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.sh @@ -10,13 +10,13 @@ CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) for STORAGE_POLICY in 
's3_cache' 'local_cache'; do echo "Using storage policy: $STORAGE_POLICY" - $CLICKHOUSE_CLIENT --query "DROP TABLE IF EXISTS test_02241" - $CLICKHOUSE_CLIENT --query "CREATE TABLE test_02241 (key UInt32, value String) Engine=MergeTree() ORDER BY key SETTINGS storage_policy='$STORAGE_POLICY', min_bytes_for_wide_part = 10485760, compress_marks=false, compress_primary_key=false, ratio_of_defaults_for_sparse_serialization = 1" - $CLICKHOUSE_CLIENT --query "SYSTEM STOP MERGES test_02241" + $CLICKHOUSE_CLIENT --echo --query "DROP TABLE IF EXISTS test_02241" + $CLICKHOUSE_CLIENT --echo --query "CREATE TABLE test_02241 (key UInt32, value String) Engine=MergeTree() ORDER BY key SETTINGS storage_policy='$STORAGE_POLICY', min_bytes_for_wide_part = 10485760, compress_marks=false, compress_primary_key=false, ratio_of_defaults_for_sparse_serialization = 1" + $CLICKHOUSE_CLIENT --echo --query "SYSTEM STOP MERGES test_02241" - $CLICKHOUSE_CLIENT --query "SYSTEM DROP FILESYSTEM CACHE" + $CLICKHOUSE_CLIENT --echo --query "SYSTEM DROP FILESYSTEM CACHE" - $CLICKHOUSE_CLIENT -n --query "SELECT file_segment_range_begin, file_segment_range_end, size, state + $CLICKHOUSE_CLIENT --echo -n --query "SELECT file_segment_range_begin, file_segment_range_end, size, state FROM ( SELECT file_segment_range_begin, file_segment_range_end, size, state, local_path @@ -32,12 +32,12 @@ for STORAGE_POLICY in 's3_cache' 'local_cache'; do WHERE endsWith(local_path, 'data.bin') FORMAT Vertical" - $CLICKHOUSE_CLIENT --query "SELECT count() FROM (SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path FROM system.remote_data_paths ) AS data_paths INNER JOIN system.filesystem_cache AS caches ON data_paths.cache_path = caches.cache_path" - $CLICKHOUSE_CLIENT --query "SELECT count(), sum(size) FROM system.filesystem_cache" + $CLICKHOUSE_CLIENT --echo --query "SELECT count() FROM (SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path FROM system.remote_data_paths ) AS data_paths INNER JOIN system.filesystem_cache AS caches ON data_paths.cache_path = caches.cache_path" + $CLICKHOUSE_CLIENT --echo --query "SELECT count(), sum(size) FROM system.filesystem_cache" - $CLICKHOUSE_CLIENT --enable_filesystem_cache_on_write_operations=1 --query "INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100)" + $CLICKHOUSE_CLIENT --echo --enable_filesystem_cache_on_write_operations=1 --query "INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100)" - $CLICKHOUSE_CLIENT -n --query "SELECT file_segment_range_begin, file_segment_range_end, size, state + $CLICKHOUSE_CLIENT --echo -n --query "SELECT file_segment_range_begin, file_segment_range_end, size, state FROM ( SELECT file_segment_range_begin, file_segment_range_end, size, state, local_path @@ -53,24 +53,24 @@ for STORAGE_POLICY in 's3_cache' 'local_cache'; do WHERE endsWith(local_path, 'data.bin') FORMAT Vertical" - $CLICKHOUSE_CLIENT --query "SELECT count() FROM (SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path FROM system.remote_data_paths ) AS data_paths INNER JOIN system.filesystem_cache AS caches ON data_paths.cache_path = caches.cache_path" - $CLICKHOUSE_CLIENT --query "SELECT count(), sum(size) FROM system.filesystem_cache" + $CLICKHOUSE_CLIENT --echo --query "SELECT count() FROM (SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path FROM system.remote_data_paths ) AS data_paths INNER JOIN system.filesystem_cache AS caches ON data_paths.cache_path = caches.cache_path" + $CLICKHOUSE_CLIENT --echo 
--query "SELECT count(), sum(size) FROM system.filesystem_cache" - $CLICKHOUSE_CLIENT --query "SELECT count() FROM system.filesystem_cache WHERE cache_hits > 0" + $CLICKHOUSE_CLIENT --echo --query "SELECT count() FROM system.filesystem_cache WHERE cache_hits > 0" - $CLICKHOUSE_CLIENT --query "SELECT * FROM test_02241 FORMAT Null" - $CLICKHOUSE_CLIENT --query "SELECT count() FROM system.filesystem_cache WHERE cache_hits > 0" + $CLICKHOUSE_CLIENT --echo --query "SELECT * FROM test_02241 FORMAT Null" + $CLICKHOUSE_CLIENT --echo --query "SELECT count() FROM system.filesystem_cache WHERE cache_hits > 0" - $CLICKHOUSE_CLIENT --query "SELECT * FROM test_02241 FORMAT Null" - $CLICKHOUSE_CLIENT --query "SELECT count() FROM system.filesystem_cache WHERE cache_hits > 0" + $CLICKHOUSE_CLIENT --echo --query "SELECT * FROM test_02241 FORMAT Null" + $CLICKHOUSE_CLIENT --echo --query "SELECT count() FROM system.filesystem_cache WHERE cache_hits > 0" - $CLICKHOUSE_CLIENT --query "SELECT count(), sum(size) size FROM system.filesystem_cache" + $CLICKHOUSE_CLIENT --echo --query "SELECT count(), sum(size) size FROM system.filesystem_cache" - $CLICKHOUSE_CLIENT --query "SYSTEM DROP FILESYSTEM CACHE" + $CLICKHOUSE_CLIENT --echo --query "SYSTEM DROP FILESYSTEM CACHE" - $CLICKHOUSE_CLIENT --enable_filesystem_cache_on_write_operations=1 --query "INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100, 200)" + $CLICKHOUSE_CLIENT --echo --enable_filesystem_cache_on_write_operations=1 --query "INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100, 200)" - $CLICKHOUSE_CLIENT -n --query "SELECT file_segment_range_begin, file_segment_range_end, size, state + $CLICKHOUSE_CLIENT --echo -n --query "SELECT file_segment_range_begin, file_segment_range_end, size, state FROM ( SELECT file_segment_range_begin, file_segment_range_end, size, state, local_path @@ -86,27 +86,34 @@ for STORAGE_POLICY in 's3_cache' 'local_cache'; do WHERE endsWith(local_path, 'data.bin') FORMAT Vertical;" - $CLICKHOUSE_CLIENT --query "SELECT count() FROM (SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path FROM system.remote_data_paths ) AS data_paths INNER JOIN system.filesystem_cache AS caches ON data_paths.cache_path = caches.cache_path" - $CLICKHOUSE_CLIENT --query "SELECT count(), sum(size) FROM system.filesystem_cache" + $CLICKHOUSE_CLIENT --echo --query "SELECT count() FROM (SELECT arrayJoin(cache_paths) AS cache_path, local_path, remote_path FROM system.remote_data_paths ) AS data_paths INNER JOIN system.filesystem_cache AS caches ON data_paths.cache_path = caches.cache_path" + $CLICKHOUSE_CLIENT --echo --query "SELECT count(), sum(size) FROM system.filesystem_cache" - $CLICKHOUSE_CLIENT --query "SELECT count(), sum(size) FROM system.filesystem_cache" - $CLICKHOUSE_CLIENT --enable_filesystem_cache_on_write_operations=1 --query "INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100) SETTINGS enable_filesystem_cache_on_write_operations=0" - $CLICKHOUSE_CLIENT --query "SELECT count(), sum(size) FROM system.filesystem_cache" + $CLICKHOUSE_CLIENT --echo --query "SELECT count(), sum(size) FROM system.filesystem_cache" + $CLICKHOUSE_CLIENT --echo --enable_filesystem_cache_on_write_operations=1 --query "INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100) SETTINGS enable_filesystem_cache_on_write_operations=0" + $CLICKHOUSE_CLIENT --echo --query "SELECT count(), sum(size) FROM system.filesystem_cache" - $CLICKHOUSE_CLIENT 
--enable_filesystem_cache_on_write_operations=1 --query "INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100)" - $CLICKHOUSE_CLIENT --enable_filesystem_cache_on_write_operations=1 --query "INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(300, 10000)" - $CLICKHOUSE_CLIENT --query "SELECT count(), sum(size) FROM system.filesystem_cache" + $CLICKHOUSE_CLIENT --echo --enable_filesystem_cache_on_write_operations=1 --query "INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(100)" + $CLICKHOUSE_CLIENT --echo --enable_filesystem_cache_on_write_operations=1 --query "INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(300, 10000)" + $CLICKHOUSE_CLIENT --echo --query "SELECT count(), sum(size) FROM system.filesystem_cache" - $CLICKHOUSE_CLIENT --query "SYSTEM START MERGES test_02241" + $CLICKHOUSE_CLIENT --echo --query "SYSTEM START MERGES test_02241" - $CLICKHOUSE_CLIENT --enable_filesystem_cache_on_write_operations=1 --query "OPTIMIZE TABLE test_02241 FINAL" - $CLICKHOUSE_CLIENT --query "SELECT count(), sum(size) FROM system.filesystem_cache" + $CLICKHOUSE_CLIENT --echo --query "SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes'" + $CLICKHOUSE_CLIENT --echo --query "SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes'" - $CLICKHOUSE_CLIENT --enable_filesystem_cache_on_write_operations=1 --mutations_sync=2 --query "ALTER TABLE test_02241 UPDATE value = 'kek' WHERE key = 100" - $CLICKHOUSE_CLIENT --query "SELECT count(), sum(size) FROM system.filesystem_cache" - $CLICKHOUSE_CLIENT --enable_filesystem_cache_on_write_operations=1 --query "INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(5000000)" + $CLICKHOUSE_CLIENT --echo --enable_filesystem_cache_on_write_operations=1 --query "OPTIMIZE TABLE test_02241 FINAL" - $CLICKHOUSE_CLIENT --query "SYSTEM FLUSH LOGS" + $CLICKHOUSE_CLIENT --echo --query "SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes'" + $CLICKHOUSE_CLIENT --echo --query "SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes'" + + $CLICKHOUSE_CLIENT --echo --query "SELECT count(), sum(size) FROM system.filesystem_cache" + + $CLICKHOUSE_CLIENT --echo --enable_filesystem_cache_on_write_operations=1 --mutations_sync=2 --query "ALTER TABLE test_02241 UPDATE value = 'kek' WHERE key = 100" + $CLICKHOUSE_CLIENT --echo --query "SELECT count(), sum(size) FROM system.filesystem_cache" + $CLICKHOUSE_CLIENT --echo --enable_filesystem_cache_on_write_operations=1 --query "INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(5000000)" + + $CLICKHOUSE_CLIENT --echo --query "SYSTEM FLUSH LOGS" $CLICKHOUSE_CLIENT -n --query "SELECT query, ProfileEvents['RemoteFSReadBytes'] > 0 as remote_fs_read @@ -121,6 +128,6 @@ for STORAGE_POLICY in 's3_cache' 'local_cache'; do DESC LIMIT 1" - $CLICKHOUSE_CLIENT --query "SELECT count() FROM test_02241" - $CLICKHOUSE_CLIENT --query "SELECT count() FROM test_02241 WHERE value LIKE '%010%'" + $CLICKHOUSE_CLIENT --echo --query "SELECT count() FROM test_02241" + $CLICKHOUSE_CLIENT --echo --query "SELECT count() FROM test_02241 WHERE value LIKE '%010%'" done From a80747b2385647678771281d815867ef87b580f6 Mon Sep 17 00:00:00 2001 From: Michael Kolupaev Date: Thu, 22 Feb 2024 15:57:10 +0000 Subject: [PATCH 051/985] Undo something to the test --- .../0_stateless/02998_primary_key_skip_columns.reference | 2 +- tests/queries/0_stateless/02998_primary_key_skip_columns.sql | 
2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/tests/queries/0_stateless/02998_primary_key_skip_columns.reference b/tests/queries/0_stateless/02998_primary_key_skip_columns.reference index ec44acbd16b..08ccdb83b11 100644 --- a/tests/queries/0_stateless/02998_primary_key_skip_columns.reference +++ b/tests/queries/0_stateless/02998_primary_key_skip_columns.reference @@ -15,4 +15,4 @@ Key size: 2400000 120 2334 19 -Key size ok: 1 1 +Key size: 800000 diff --git a/tests/queries/0_stateless/02998_primary_key_skip_columns.sql b/tests/queries/0_stateless/02998_primary_key_skip_columns.sql index 27672d7854e..b2dadcc5e7c 100644 --- a/tests/queries/0_stateless/02998_primary_key_skip_columns.sql +++ b/tests/queries/0_stateless/02998_primary_key_skip_columns.sql @@ -28,6 +28,6 @@ SELECT count() FROM test WHERE b > 7898976344263989848 AND b < 80403209398191531 SELECT count() FROM test WHERE a > 1849813033528774208 AND a < 4594276315503201760 AND c > 13239894303140990071 AND c < 16179795840886947236; SELECT count() FROM test WHERE a > 1849813033528774208 AND a < 4594276315503201760 AND b > 7898976344263989848 AND b < 8040320939819153137 AND c > 13239894303140990071 AND c < 16179795840886947236; -SELECT 'Key size ok: ', (sum(primary_key_bytes_in_memory) as s) >= 800000, s < 1200000 FROM system.parts WHERE database = currentDatabase() AND table = 'test'; +SELECT 'Key size: ', round(sum(primary_key_bytes_in_memory), -5) FROM system.parts WHERE database = currentDatabase() AND table = 'test'; DROP TABLE test; From a34f42ca22c8a4820e4cbcf67cdd48a3589e3879 Mon Sep 17 00:00:00 2001 From: Azat Khuzhin Date: Sat, 13 Jan 2024 18:48:47 +0300 Subject: [PATCH 052/985] Remove lock from the ReadProgressCallback It looks redundant (added in 5ef51ed), though it has "fix tests" in the log message, but CI reports is not available for the commits from that PR [1], so let's try. [1]: https://github.com/ClickHouse/ClickHouse/pull/37543 Also this can be a big problem, since the code under that lock (throttling or quotas with previous implementation that uses boost::atomic_shared_ptr) may sleep. Some numbers: run | time ------------------------|------ max_threads=100 before | 23.1 max_threads=100 after | 15.1 max_threads=4500 before | 4.5 max_threads=4500 after | 2.3 Query: select sum(number) from numbers_mt(2000000) settings max_threads=X, max_block_size = 1 Signed-off-by: Azat Khuzhin --- src/QueryPipeline/ReadProgressCallback.cpp | 2 -- src/QueryPipeline/ReadProgressCallback.h | 1 - tests/performance/small_block_contention.xml | 3 +++ 3 files changed, 3 insertions(+), 3 deletions(-) create mode 100644 tests/performance/small_block_contention.xml diff --git a/src/QueryPipeline/ReadProgressCallback.cpp b/src/QueryPipeline/ReadProgressCallback.cpp index 59843d8791d..e90fc24d882 100644 --- a/src/QueryPipeline/ReadProgressCallback.cpp +++ b/src/QueryPipeline/ReadProgressCallback.cpp @@ -126,8 +126,6 @@ bool ReadProgressCallback::onProgress(uint64_t read_rows, uint64_t read_bytes, c CurrentThread::updatePerformanceCountersIfNeeded(); - std::lock_guard lock(limits_and_quotas_mutex); - /// TODO: Should be done in PipelineExecutor. 
for (const auto & limits : storage_limits) limits.local_limits.speed_limits.throttle(progress.read_rows, progress.read_bytes, total_rows, total_stopwatch.elapsedMicroseconds(), limits.local_limits.timeout_overflow_mode); diff --git a/src/QueryPipeline/ReadProgressCallback.h b/src/QueryPipeline/ReadProgressCallback.h index 5dbf3344bdf..7dfed9df5da 100644 --- a/src/QueryPipeline/ReadProgressCallback.h +++ b/src/QueryPipeline/ReadProgressCallback.h @@ -41,7 +41,6 @@ private: /// The total number of bytes to read. For progress bar. std::atomic_size_t total_bytes = 0; - std::mutex limits_and_quotas_mutex; Stopwatch total_stopwatch{CLOCK_MONOTONIC_COARSE}; /// Including waiting time bool update_profile_events = true; diff --git a/tests/performance/small_block_contention.xml b/tests/performance/small_block_contention.xml new file mode 100644 index 00000000000..ce1995a0a29 --- /dev/null +++ b/tests/performance/small_block_contention.xml @@ -0,0 +1,3 @@ + + select sum(number) from numbers_mt(200000) settings max_threads=100, max_block_size = 1 format Null + From 9cb1ade3e2967507885f5b0e3deefab2ad40082c Mon Sep 17 00:00:00 2001 From: serxa Date: Thu, 22 Feb 2024 17:07:47 +0000 Subject: [PATCH 053/985] fix db iterator wait --- src/Common/AsyncLoader.cpp | 2 +- src/Databases/DatabaseOrdinary.cpp | 20 ++++++++++++++++---- src/Databases/IDatabase.h | 17 +---------------- src/Interpreters/InterpreterDropQuery.cpp | 2 +- 4 files changed, 19 insertions(+), 22 deletions(-) diff --git a/src/Common/AsyncLoader.cpp b/src/Common/AsyncLoader.cpp index 140194e10b4..4a39454ccbb 100644 --- a/src/Common/AsyncLoader.cpp +++ b/src/Common/AsyncLoader.cpp @@ -39,7 +39,7 @@ void logAboutProgress(LoggerPtr log, size_t processed, size_t total, AtomicStopw { if (total && (processed % PRINT_MESSAGE_EACH_N_OBJECTS == 0 || watch.compareAndRestart(PRINT_MESSAGE_EACH_N_SECONDS))) { - LOG_INFO(log, "Processed: {}%", static_cast(processed * 1000.0 / total) * 0.1); + LOG_INFO(log, "Processed: {:.1f}%", static_cast(processed) * 100.0 / total); watch.restart(); } } diff --git a/src/Databases/DatabaseOrdinary.cpp b/src/Databases/DatabaseOrdinary.cpp index 644bed23350..40e0fb0a0ed 100644 --- a/src/Databases/DatabaseOrdinary.cpp +++ b/src/Databases/DatabaseOrdinary.cpp @@ -289,10 +289,22 @@ void DatabaseOrdinary::stopLoading() DatabaseTablesIteratorPtr DatabaseOrdinary::getTablesIterator(ContextPtr local_context, const DatabaseOnDisk::FilterByNameFunction & filter_by_table_name) const { - auto result = DatabaseWithOwnTablesBase::getTablesIterator(local_context, filter_by_table_name); - std::scoped_lock lock(mutex); - typeid_cast(*result).setLoadTasks(startup_table); - return result; + // Wait for every table (matching the filter) to be loaded and started up before we make the snapshot. + // It is important, because otherwise table might be: + // - not attached and thus will be missed in the snapshot; + // - not started, which is not good for DDL operations. 
+ LoadTaskPtrs tasks_to_wait; + { + std::lock_guard lock(mutex); + if (!filter_by_table_name) + tasks_to_wait.reserve(startup_table.size()); + for (const auto & [table_name, task] : startup_table) + if (!filter_by_table_name || filter_by_table_name(table_name)) + tasks_to_wait.emplace_back(task); + } + waitLoad(currentPoolOr(TablesLoaderForegroundPoolId), tasks_to_wait); + + return DatabaseWithOwnTablesBase::getTablesIterator(local_context, filter_by_table_name); } void DatabaseOrdinary::alterTable(ContextPtr local_context, const StorageID & table_id, const StorageInMemoryMetadata & metadata) diff --git a/src/Databases/IDatabase.h b/src/Databases/IDatabase.h index ec380fa759d..75662bfebe3 100644 --- a/src/Databases/IDatabase.h +++ b/src/Databases/IDatabase.h @@ -77,17 +77,12 @@ private: Tables tables; Tables::iterator it; - // Tasks to wait before returning a table - using Tasks = std::unordered_map; - Tasks tasks; - protected: DatabaseTablesSnapshotIterator(DatabaseTablesSnapshotIterator && other) noexcept : IDatabaseTablesIterator(std::move(other.database_name)) { size_t idx = std::distance(other.tables.begin(), other.it); std::swap(tables, other.tables); - std::swap(tasks, other.tasks); other.it = other.tables.end(); it = tables.begin(); std::advance(it, idx); @@ -110,17 +105,7 @@ public: const String & name() const override { return it->first; } - const StoragePtr & table() const override - { - if (auto task = tasks.find(it->first); task != tasks.end()) - waitLoad(currentPoolOr(TablesLoaderForegroundPoolId), task->second); - return it->second; - } - - void setLoadTasks(const Tasks & tasks_) - { - tasks = tasks_; - } + const StoragePtr & table() const override { return it->second; } }; using DatabaseTablesIteratorPtr = std::unique_ptr; diff --git a/src/Interpreters/InterpreterDropQuery.cpp b/src/Interpreters/InterpreterDropQuery.cpp index 711100b5de1..72aa4cc63e3 100644 --- a/src/Interpreters/InterpreterDropQuery.cpp +++ b/src/Interpreters/InterpreterDropQuery.cpp @@ -417,7 +417,7 @@ BlockIO InterpreterDropQuery::executeToDatabaseImpl(const ASTDropQuery & query, uuids_to_wait.push_back(table_to_wait); } } - // only if operation is DETACH + // only if operation is DETACH if ((!drop || !truncate) && query.sync) { /// Avoid "some tables are still in use" when sync mode is enabled From 835b47519a7c575d70542e5a37c97dbf5a2b25f9 Mon Sep 17 00:00:00 2001 From: Nikita Taranov Date: Wed, 14 Feb 2024 00:44:38 +0100 Subject: [PATCH 054/985] impl --- src/Backups/BackupIO_S3.cpp | 1 + src/Coordination/KeeperSnapshotManagerS3.cpp | 1 + src/Disks/ObjectStorages/S3/diskSettings.cpp | 1 + src/IO/S3/Client.cpp | 19 +++++++++--- src/IO/S3/Client.h | 6 ++++ src/IO/S3/Requests.h | 32 ++++++++++++++++++-- src/IO/S3/URI.cpp | 18 +++++------ src/IO/S3/tests/gtest_aws_s3_client.cpp | 25 ++++++++++++++- src/IO/WriteBufferFromS3.cpp | 15 ++++++++- src/IO/WriteBufferFromS3.h | 1 + src/IO/tests/gtest_s3_uri.cpp | 8 +++++ src/IO/tests/gtest_writebuffer_s3.cpp | 21 +++++++------ src/Storages/StorageS3.cpp | 1 + 13 files changed, 119 insertions(+), 30 deletions(-) diff --git a/src/Backups/BackupIO_S3.cpp b/src/Backups/BackupIO_S3.cpp index 9359602a651..2063af2061c 100644 --- a/src/Backups/BackupIO_S3.cpp +++ b/src/Backups/BackupIO_S3.cpp @@ -73,6 +73,7 @@ namespace .use_virtual_addressing = s3_uri.is_virtual_hosted_style, .disable_checksum = local_settings.s3_disable_checksum, .gcs_issue_compose_request = context->getConfigRef().getBool("s3.gcs_issue_compose_request", false), + .is_s3express_bucket = 
S3::isS3ExpressEndpoint(s3_uri.endpoint), }; return S3::ClientFactory::instance().create( diff --git a/src/Coordination/KeeperSnapshotManagerS3.cpp b/src/Coordination/KeeperSnapshotManagerS3.cpp index 0337a564660..9779a041095 100644 --- a/src/Coordination/KeeperSnapshotManagerS3.cpp +++ b/src/Coordination/KeeperSnapshotManagerS3.cpp @@ -103,6 +103,7 @@ void KeeperSnapshotManagerS3::updateS3Configuration(const Poco::Util::AbstractCo .use_virtual_addressing = new_uri.is_virtual_hosted_style, .disable_checksum = false, .gcs_issue_compose_request = false, + .is_s3express_bucket = S3::isS3ExpressEndpoint(new_uri.endpoint), }; auto client = S3::ClientFactory::instance().create( diff --git a/src/Disks/ObjectStorages/S3/diskSettings.cpp b/src/Disks/ObjectStorages/S3/diskSettings.cpp index 4fd4b17aabe..b8688cd3de6 100644 --- a/src/Disks/ObjectStorages/S3/diskSettings.cpp +++ b/src/Disks/ObjectStorages/S3/diskSettings.cpp @@ -97,6 +97,7 @@ std::unique_ptr getClient( .use_virtual_addressing = uri.is_virtual_hosted_style, .disable_checksum = local_settings.s3_disable_checksum, .gcs_issue_compose_request = config.getBool("s3.gcs_issue_compose_request", false), + .is_s3express_bucket = S3::isS3ExpressEndpoint(endpoint), }; return S3::ClientFactory::instance().create( diff --git a/src/IO/S3/Client.cpp b/src/IO/S3/Client.cpp index 1b6b245b89a..a75d41df3d1 100644 --- a/src/IO/S3/Client.cpp +++ b/src/IO/S3/Client.cpp @@ -304,6 +304,9 @@ Model::HeadObjectOutcome Client::HeadObject(HeadObjectRequest & request) const request.setApiMode(api_mode); + if (isS3ExpressBucket()) + request.setIsS3ExpressBucket(); + addAdditionalAMZHeadersToCanonicalHeadersList(request, client_configuration.extra_headers); if (auto region = getRegionForBucket(bucket); !region.empty()) @@ -530,7 +533,11 @@ Client::doRequest(RequestType & request, RequestFn request_fn) const addAdditionalAMZHeadersToCanonicalHeadersList(request, client_configuration.extra_headers); const auto & bucket = request.GetBucket(); request.setApiMode(api_mode); - if (client_settings.disable_checksum) + + /// We have to use checksums for S3Express buckets, so the order of checks should be the following + if (client_settings.is_s3express_bucket) + request.setIsS3ExpressBucket(); + else if (client_settings.disable_checksum) request.disableChecksum(); if (auto region = getRegionForBucket(bucket); !region.empty()) @@ -915,9 +922,9 @@ std::unique_ptr ClientFactory::create( // NOLINT std::move(sse_kms_config), credentials_provider, client_configuration, // Client configuration. - Aws::Client::AWSAuthV4Signer::PayloadSigningPolicy::Never, - client_settings - ); + client_settings.is_s3express_bucket ? 
Aws::Client::AWSAuthV4Signer::PayloadSigningPolicy::RequestDependent + : Aws::Client::AWSAuthV4Signer::PayloadSigningPolicy::Never, + client_settings); } PocoHTTPClientConfiguration ClientFactory::createClientConfiguration( // NOLINT @@ -956,6 +963,10 @@ PocoHTTPClientConfiguration ClientFactory::createClientConfiguration( // NOLINT return config; } +bool isS3ExpressEndpoint(const std::string & endpoint) +{ + return endpoint.contains("s3express"); +} } } diff --git a/src/IO/S3/Client.h b/src/IO/S3/Client.h index 8da21bd2c2c..c7bc727bf32 100644 --- a/src/IO/S3/Client.h +++ b/src/IO/S3/Client.h @@ -92,6 +92,8 @@ private: std::unordered_map> client_caches; }; +bool isS3ExpressEndpoint(const std::string & endpoint); + struct ClientSettings { bool use_virtual_addressing; @@ -107,6 +109,7 @@ struct ClientSettings /// Ability to enable it preserved since likely it is required for old /// files. bool gcs_issue_compose_request; + bool is_s3express_bucket; }; /// Client that improves the client from the AWS SDK @@ -208,6 +211,9 @@ public: const std::shared_ptr& httpRequest) const override; bool supportsMultiPartCopy() const; + + bool isS3ExpressBucket() const { return client_settings.is_s3express_bucket; } + private: friend struct ::MockS3::Client; diff --git a/src/IO/S3/Requests.h b/src/IO/S3/Requests.h index bfb94a5a67e..6f82a0f39d3 100644 --- a/src/IO/S3/Requests.h +++ b/src/IO/S3/Requests.h @@ -21,12 +21,32 @@ #include #include #include +#include +#include + +#include namespace DB::S3 { namespace Model = Aws::S3::Model; +/// Used only for S3Express +namespace RequestChecksum +{ +inline void setPartChecksum(Model::CompletedPart & part, const std::string & checksum) +{ + part.SetChecksumCRC32(checksum); +} + +template +inline void setChecksumAlgorithm(R & request) +{ + if constexpr (requires { request.SetChecksumAlgorithm(Model::ChecksumAlgorithm::CRC32); }) + request.SetChecksumAlgorithm(Model::ChecksumAlgorithm::CRC32); +} +}; + template class ExtendedRequest : public BaseRequest { @@ -49,11 +69,13 @@ public: Aws::String GetChecksumAlgorithmName() const override { + chassert(!is_s3express_bucket || checksum); + /// Return empty string is enough to disable checksums (see /// AWSClient::AddChecksumToRequest [1] for more details). /// /// [1]: https://github.com/aws/aws-sdk-cpp/blob/b0ee1c0d336dbb371c34358b68fba6c56aae2c92/src/aws-cpp-sdk-core/source/client/AWSClient.cpp#L783-L839 - if (!checksum) + if (!is_s3express_bucket && !checksum) return ""; return BaseRequest::GetChecksumAlgorithmName(); } @@ -84,9 +106,12 @@ public: } /// Disable checksum to avoid extra read of the input stream - void disableChecksum() const + void disableChecksum() const { checksum = false; } + + void setIsS3ExpressBucket() { - checksum = false; + is_s3express_bucket = true; + RequestChecksum::setChecksumAlgorithm(*this); } protected: @@ -94,6 +119,7 @@ protected: mutable std::optional uri_override; mutable ApiMode api_mode{ApiMode::AWS}; mutable bool checksum = true; + bool is_s3express_bucket = false; }; class CopyObjectRequest : public ExtendedRequest diff --git a/src/IO/S3/URI.cpp b/src/IO/S3/URI.cpp index 23f59420bfe..062d3b80850 100644 --- a/src/IO/S3/URI.cpp +++ b/src/IO/S3/URI.cpp @@ -35,7 +35,7 @@ URI::URI(const std::string & uri_) /// Case when bucket name represented in domain name of S3 URL. /// E.g. 
(https://bucket-name.s3.Region.amazonaws.com/key) /// https://docs.aws.amazon.com/AmazonS3/latest/dev/VirtualHosting.html#virtual-hosted-style-access - static const RE2 virtual_hosted_style_pattern(R"((.+)\.(s3|cos|obs|oss|eos)([.\-][a-z0-9\-.:]+))"); + static const RE2 virtual_hosted_style_pattern(R"((.+)\.(s3express[\-a-z0-9]+|s3|cos|obs|oss|eos)([.\-][a-z0-9\-.:]+))"); /// Case when bucket name and key represented in path of S3 URL. /// E.g. (https://s3.Region.amazonaws.com/bucket-name/key) @@ -43,6 +43,7 @@ URI::URI(const std::string & uri_) static const RE2 path_style_pattern("^/([^/]*)/(.*)"); static constexpr auto S3 = "S3"; + static constexpr auto S3EXPRESS = "S3EXPRESS"; static constexpr auto COSN = "COSN"; static constexpr auto COS = "COS"; static constexpr auto OBS = "OBS"; @@ -115,21 +116,16 @@ URI::URI(const std::string & uri_) } boost::to_upper(name); - if (name != S3 && name != COS && name != OBS && name != OSS && name != EOS) + /// For S3Express it will look like s3express-eun1-az1, i.e. contain region and AZ info + if (name != S3 && !name.starts_with(S3EXPRESS) && name != COS && name != OBS && name != OSS && name != EOS) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Object storage system name is unrecognized in virtual hosted style S3 URI: {}", quoteString(name)); - if (name == S3) - storage_name = name; - else if (name == OBS) - storage_name = OBS; - else if (name == OSS) - storage_name = OSS; - else if (name == EOS) - storage_name = EOS; - else + if (name == COS || name == COSN) storage_name = COSN; + else + storage_name = name; } else if (re2::RE2::PartialMatch(uri.getPath(), path_style_pattern, &bucket, &key)) { diff --git a/src/IO/S3/tests/gtest_aws_s3_client.cpp b/src/IO/S3/tests/gtest_aws_s3_client.cpp index 33917314bca..8edbe12a22f 100644 --- a/src/IO/S3/tests/gtest_aws_s3_client.cpp +++ b/src/IO/S3/tests/gtest_aws_s3_client.cpp @@ -110,7 +110,8 @@ void testServerSideEncryption( bool disable_checksum, String server_side_encryption_customer_key_base64, DB::S3::ServerSideEncryptionKMSConfig sse_kms_config, - String expected_headers) + String expected_headers, + bool is_s3express_bucket = false) { TestPocoHTTPServer http; @@ -144,6 +145,7 @@ void testServerSideEncryption( .use_virtual_addressing = uri.is_virtual_hosted_style, .disable_checksum = disable_checksum, .gcs_issue_compose_request = false, + .is_s3express_bucket = is_s3express_bucket, }; std::shared_ptr client = DB::S3::ClientFactory::instance().create( @@ -295,4 +297,25 @@ TEST(IOTestAwsS3Client, AppendExtraSSEKMSHeadersWrite) "x-amz-server-side-encryption-context: arn:aws:s3:::bucket_ARN\n"); } +TEST(IOTestAwsS3Client, ChecksumHeaderIsPresentForS3Express) +{ + /// See https://github.com/ClickHouse/ClickHouse/pull/19748 + testServerSideEncryption( + doWriteRequest, + /* disable_checksum= */ true, + "", + {}, + "authorization: ... 
SignedHeaders=" + "amz-sdk-invocation-id;" + "amz-sdk-request;" + "content-length;" + "content-type;" + "host;" + "x-amz-checksum-crc32;" + "x-amz-content-sha256;" + "x-amz-date;" + "x-amz-sdk-checksum-algorithm, ...\n", + /*is_s3express_bucket=*/true); +} + #endif diff --git a/src/IO/WriteBufferFromS3.cpp b/src/IO/WriteBufferFromS3.cpp index 5bb01050591..a162992278f 100644 --- a/src/IO/WriteBufferFromS3.cpp +++ b/src/IO/WriteBufferFromS3.cpp @@ -18,7 +18,9 @@ #include #include +#include #include +#include #include @@ -456,6 +458,14 @@ S3::UploadPartRequest WriteBufferFromS3::getUploadRequest(size_t part_number, Pa /// If we don't do it, AWS SDK can mistakenly set it to application/xml, see https://github.com/aws/aws-sdk-cpp/issues/1840 req.SetContentType("binary/octet-stream"); + /// Checksums need to be provided on CompleteMultipartUpload requests, so we calculate then manually and store in multipart_checksums + if (client_ptr->isS3ExpressBucket()) + { + chassert(req.GetChecksumAlgorithm() == Aws::S3::Model::ChecksumAlgorithm::CRC32); + req.SetChecksumCRC32(Aws::Utils::HashingUtils::Base64Encode(Aws::Utils::HashingUtils::CalculateCRC32(*(req.GetBody())))); + multipart_checksums.push_back(req.GetChecksumCRC32()); + } + return req; } @@ -575,7 +585,10 @@ void WriteBufferFromS3::completeMultipartUpload() for (size_t i = 0; i < multipart_tags.size(); ++i) { Aws::S3::Model::CompletedPart part; - multipart_upload.AddParts(part.WithETag(multipart_tags[i]).WithPartNumber(static_cast(i + 1))); + part.WithETag(multipart_tags[i]).WithPartNumber(static_cast(i + 1)); + if (!multipart_checksums.empty()) + S3::RequestChecksum::setPartChecksum(part, multipart_checksums.at(i)); + multipart_upload.AddParts(part); } req.SetMultipartUpload(multipart_upload); diff --git a/src/IO/WriteBufferFromS3.h b/src/IO/WriteBufferFromS3.h index 5dc269990a1..148cd27f854 100644 --- a/src/IO/WriteBufferFromS3.h +++ b/src/IO/WriteBufferFromS3.h @@ -100,6 +100,7 @@ private: /// We initiate upload, then upload each part and get ETag as a response, and then finalizeImpl() upload with listing all our parts. 
String multipart_upload_id; std::deque multipart_tags; + std::deque multipart_checksums; bool multipart_upload_finished = false; /// Track that prefinalize() is called only once diff --git a/src/IO/tests/gtest_s3_uri.cpp b/src/IO/tests/gtest_s3_uri.cpp index c088e41f1e8..5bf0dfb962d 100644 --- a/src/IO/tests/gtest_s3_uri.cpp +++ b/src/IO/tests/gtest_s3_uri.cpp @@ -162,6 +162,14 @@ TEST(S3UriTest, validPatterns) ASSERT_EQ("", uri.version_id); ASSERT_EQ(false, uri.is_virtual_hosted_style); } + { + S3::URI uri("https://test-perf-bucket--eun1-az1--x-s3.s3express-eun1-az1.eu-north-1.amazonaws.com/test.csv"); + ASSERT_EQ("https://s3express-eun1-az1.eu-north-1.amazonaws.com", uri.endpoint); + ASSERT_EQ("test-perf-bucket--eun1-az1--x-s3", uri.bucket); + ASSERT_EQ("test.csv", uri.key); + ASSERT_EQ("", uri.version_id); + ASSERT_EQ(true, uri.is_virtual_hosted_style); + } } TEST_P(S3UriTest, invalidPatterns) diff --git a/src/IO/tests/gtest_writebuffer_s3.cpp b/src/IO/tests/gtest_writebuffer_s3.cpp index ae00bb2e9e2..d9cb486c09e 100644 --- a/src/IO/tests/gtest_writebuffer_s3.cpp +++ b/src/IO/tests/gtest_writebuffer_s3.cpp @@ -205,16 +205,17 @@ struct Client : DB::S3::Client { explicit Client(std::shared_ptr mock_s3_store) : DB::S3::Client( - 100, - DB::S3::ServerSideEncryptionKMSConfig(), - std::make_shared("", ""), - GetClientConfiguration(), - Aws::Client::AWSAuthV4Signer::PayloadSigningPolicy::Never, - DB::S3::ClientSettings{ - .use_virtual_addressing = true, - .disable_checksum= false, - .gcs_issue_compose_request = false, - }) + 100, + DB::S3::ServerSideEncryptionKMSConfig(), + std::make_shared("", ""), + GetClientConfiguration(), + Aws::Client::AWSAuthV4Signer::PayloadSigningPolicy::Never, + DB::S3::ClientSettings{ + .use_virtual_addressing = true, + .disable_checksum = false, + .gcs_issue_compose_request = false, + .is_s3express_bucket = false, + }) , store(mock_s3_store) {} diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp index 2d8ef3df1c8..044a1ca5362 100644 --- a/src/Storages/StorageS3.cpp +++ b/src/Storages/StorageS3.cpp @@ -1427,6 +1427,7 @@ void StorageS3::Configuration::connect(const ContextPtr & context) .use_virtual_addressing = url.is_virtual_hosted_style, .disable_checksum = local_settings.s3_disable_checksum, .gcs_issue_compose_request = context->getConfigRef().getBool("s3.gcs_issue_compose_request", false), + .is_s3express_bucket = S3::isS3ExpressEndpoint(url.endpoint), }; auto credentials = Aws::Auth::AWSCredentials(auth_settings.access_key_id, auth_settings.secret_access_key, auth_settings.session_token); From 18741f122eabaeb7903f355958af1e1a88818e83 Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 26 Feb 2024 12:42:13 +0800 Subject: [PATCH 055/985] Move a setting to server setting --- src/Core/ServerSettings.h | 2 ++ src/Core/Settings.h | 1 - src/Interpreters/Context.cpp | 2 +- .../config.d/force_read_through_cache_for_merges.xml | 3 +++ tests/integration/test_filesystem_cache/test.py | 2 +- .../users.d/force_read_through_cache_on_merge.xml | 7 ------- 6 files changed, 7 insertions(+), 10 deletions(-) create mode 100644 tests/integration/test_filesystem_cache/config.d/force_read_through_cache_for_merges.xml delete mode 100644 tests/integration/test_filesystem_cache/users.d/force_read_through_cache_on_merge.xml diff --git a/src/Core/ServerSettings.h b/src/Core/ServerSettings.h index de2a4e9b755..0283b98638f 100644 --- a/src/Core/ServerSettings.h +++ b/src/Core/ServerSettings.h @@ -103,6 +103,8 @@ namespace DB M(Bool, async_load_databases, false, "Enable 
asynchronous loading of databases and tables to speedup server startup. Queries to not yet loaded entity will be blocked until load is finished.", 0) \ M(Bool, display_secrets_in_show_and_select, false, "Allow showing secrets in SHOW and SELECT queries via a format setting and a grant", 0) \ \ + M(Bool, force_read_through_cache_for_merges, false, "Force read-through filesystem cache for merges", 0) \ + \ M(Seconds, keep_alive_timeout, DEFAULT_HTTP_KEEP_ALIVE_TIMEOUT, "The number of seconds that ClickHouse waits for incoming requests before closing the connection.", 0) \ M(Seconds, replicated_fetches_http_connection_timeout, 0, "HTTP connection timeout for part fetch requests. Inherited from default profile `http_connection_timeout` if not set explicitly.", 0) \ M(Seconds, replicated_fetches_http_send_timeout, 0, "HTTP send timeout for part fetch requests. Inherited from default profile `http_send_timeout` if not set explicitly.", 0) \ diff --git a/src/Core/Settings.h b/src/Core/Settings.h index db060bf712d..433195af9c3 100644 --- a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -769,7 +769,6 @@ class IColumn; M(Bool, enable_filesystem_cache_on_write_operations, false, "Write into cache on write operations. To actually work this setting requires be added to disk config too", 0) \ M(Bool, enable_filesystem_cache_log, false, "Allows to record the filesystem caching log for each query", 0) \ M(Bool, read_from_filesystem_cache_if_exists_otherwise_bypass_cache, false, "Allow to use the filesystem cache in passive mode - benefit from the existing cache entries, but don't put more entries into the cache. If you set this setting for heavy ad-hoc queries and leave it disabled for short real-time queries, this will allows to avoid cache threshing by too heavy queries and to improve the overall system efficiency.", 0) \ - M(Bool, force_read_through_cache_for_merges, false, "Force read-through cache for merges", 0) \ M(Bool, skip_download_if_exceeds_query_cache, true, "Skip download from remote filesystem if exceeds query cache size", 0) \ M(UInt64, filesystem_cache_max_download_size, (128UL * 1024 * 1024 * 1024), "Max remote filesystem cache size that can be downloaded by a single query", 0) \ M(Bool, throw_on_error_from_cache_on_write_operations, false, "Ignore error from cache when caching on write operations (INSERT, merges)", 0) \ diff --git a/src/Interpreters/Context.cpp b/src/Interpreters/Context.cpp index 36b362e36bb..a974eaca067 100644 --- a/src/Interpreters/Context.cpp +++ b/src/Interpreters/Context.cpp @@ -5079,7 +5079,7 @@ ReadSettings Context::getReadSettings() const res.read_from_filesystem_cache_if_exists_otherwise_bypass_cache = settings.read_from_filesystem_cache_if_exists_otherwise_bypass_cache; res.enable_filesystem_cache_log = settings.enable_filesystem_cache_log; res.filesystem_cache_segments_batch_size = settings.filesystem_cache_segments_batch_size; - res.force_read_through_cache_merges = settings.force_read_through_cache_for_merges; + res.force_read_through_cache_merges = getServerSettings().force_read_through_cache_for_merges; res.filesystem_cache_max_download_size = settings.filesystem_cache_max_download_size; res.skip_download_if_exceeds_query_cache = settings.skip_download_if_exceeds_query_cache; diff --git a/tests/integration/test_filesystem_cache/config.d/force_read_through_cache_for_merges.xml b/tests/integration/test_filesystem_cache/config.d/force_read_through_cache_for_merges.xml new file mode 100644 index 00000000000..bb2a6e850a4 --- /dev/null +++ 
b/tests/integration/test_filesystem_cache/config.d/force_read_through_cache_for_merges.xml @@ -0,0 +1,3 @@ + + 1 + diff --git a/tests/integration/test_filesystem_cache/test.py b/tests/integration/test_filesystem_cache/test.py index c1ba6702dcf..f32fa4e9823 100644 --- a/tests/integration/test_filesystem_cache/test.py +++ b/tests/integration/test_filesystem_cache/test.py @@ -42,9 +42,9 @@ def cluster(): "node_force_read_through_cache_on_merge", main_configs=[ "config.d/storage_conf.xml", + "config.d/force_read_through_cache_for_merges.xml", ], user_configs=[ - "users.d/force_read_through_cache_on_merge.xml", "users.d/cache_on_write_operations.xml", ], stay_alive=True, diff --git a/tests/integration/test_filesystem_cache/users.d/force_read_through_cache_on_merge.xml b/tests/integration/test_filesystem_cache/users.d/force_read_through_cache_on_merge.xml deleted file mode 100644 index 4d26a1a8bc7..00000000000 --- a/tests/integration/test_filesystem_cache/users.d/force_read_through_cache_on_merge.xml +++ /dev/null @@ -1,7 +0,0 @@ - - - - 1 - - - From bf5affbe640976d2b73e12f5213a13baacf40619 Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 26 Feb 2024 16:37:09 +0800 Subject: [PATCH 056/985] Fix test --- .../02241_filesystem_cache_on_write_operations.sh | 6 ------ 1 file changed, 6 deletions(-) diff --git a/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.sh b/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.sh index 2b237492e98..ee1d942a421 100755 --- a/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.sh +++ b/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.sh @@ -99,14 +99,8 @@ for STORAGE_POLICY in 's3_cache' 'local_cache'; do $CLICKHOUSE_CLIENT --echo --query "SYSTEM START MERGES test_02241" - $CLICKHOUSE_CLIENT --echo --query "SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes'" - $CLICKHOUSE_CLIENT --echo --query "SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes'" - $CLICKHOUSE_CLIENT --echo --enable_filesystem_cache_on_write_operations=1 --query "OPTIMIZE TABLE test_02241 FINAL" - $CLICKHOUSE_CLIENT --echo --query "SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes'" - $CLICKHOUSE_CLIENT --echo --query "SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes'" - $CLICKHOUSE_CLIENT --echo --query "SELECT count(), sum(size) FROM system.filesystem_cache" $CLICKHOUSE_CLIENT --echo --enable_filesystem_cache_on_write_operations=1 --mutations_sync=2 --query "ALTER TABLE test_02241 UPDATE value = 'kek' WHERE key = 100" From 277e8d965555b4fcd09a755282666bcae36adae6 Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 26 Feb 2024 14:03:53 +0800 Subject: [PATCH 057/985] Fix usage plain metadata type with new configuration option --- src/Disks/DiskType.cpp | 48 +++++++++++++++++++ src/Disks/DiskType.h | 34 +------------ src/Disks/ObjectStorages/IObjectStorage.h | 1 + .../ObjectStorages/MetadataStorageFactory.cpp | 36 +++++++++++--- .../ObjectStorages/MetadataStorageFactory.h | 7 +++ .../ObjectStorages/ObjectStorageFactory.cpp | 43 +++++++++++++---- src/Disks/ObjectStorages/PlainObjectStorage.h | 29 +++++++++++ .../RegisterDiskObjectStorage.cpp | 24 ++-------- src/Disks/ObjectStorages/S3/S3ObjectStorage.h | 21 -------- .../configs/disk_s3.xml | 7 +++ .../test_attach_backup_from_s3_plain/test.py | 25 ++++++---- 11 files changed, 178 insertions(+), 97 deletions(-) create mode 100644 
src/Disks/ObjectStorages/PlainObjectStorage.h diff --git a/src/Disks/DiskType.cpp b/src/Disks/DiskType.cpp index 218b6ee7f26..1778ae8025b 100644 --- a/src/Disks/DiskType.cpp +++ b/src/Disks/DiskType.cpp @@ -1,7 +1,27 @@ #include "DiskType.h" +#include +#include namespace DB { +namespace ErrorCodes +{ + extern const int UNKNOWN_ELEMENT_IN_CONFIG; +} + +MetadataStorageType metadataTypeFromString(const String & type) +{ + auto check_type = Poco::toLower(type); + if (check_type == "local") + return MetadataStorageType::Local; + if (check_type == "plain") + return MetadataStorageType::Plain; + if (check_type == "web") + return MetadataStorageType::StaticWeb; + + throw Exception(ErrorCodes::UNKNOWN_ELEMENT_IN_CONFIG, + "MetadataStorageFactory: unknown metadata storage type: {}", type); +} bool DataSourceDescription::operator==(const DataSourceDescription & other) const { @@ -14,4 +34,32 @@ bool DataSourceDescription::sameKind(const DataSourceDescription & other) const == std::tie(other.type, other.object_storage_type, other.description); } +std::string DataSourceDescription::toString() const +{ + switch (type) + { + case DataSourceType::Local: + return "local"; + case DataSourceType::RAM: + return "memory"; + case DataSourceType::ObjectStorage: + { + switch (object_storage_type) + { + case ObjectStorageType::S3: + return "s3"; + case ObjectStorageType::HDFS: + return "hdfs"; + case ObjectStorageType::Azure: + return "azure_blob_storage"; + case ObjectStorageType::Local: + return "local_blob_storage"; + case ObjectStorageType::Web: + return "web"; + case ObjectStorageType::None: + return "none"; + } + } + } +} } diff --git a/src/Disks/DiskType.h b/src/Disks/DiskType.h index 15940ea9155..36fe4d83004 100644 --- a/src/Disks/DiskType.h +++ b/src/Disks/DiskType.h @@ -17,7 +17,6 @@ enum class ObjectStorageType { None, S3, - S3_Plain, Azure, HDFS, Web, @@ -30,9 +29,9 @@ enum class MetadataStorageType Local, Plain, StaticWeb, - Memory, }; +MetadataStorageType metadataTypeFromString(const String & type); String toString(DataSourceType data_source_type); struct DataSourceDescription @@ -49,36 +48,7 @@ struct DataSourceDescription bool operator==(const DataSourceDescription & other) const; bool sameKind(const DataSourceDescription & other) const; - std::string toString() const - { - switch (type) - { - case DataSourceType::Local: - return "local"; - case DataSourceType::RAM: - return "memory"; - case DataSourceType::ObjectStorage: - { - switch (object_storage_type) - { - case ObjectStorageType::S3: - return "s3"; - case ObjectStorageType::S3_Plain: - return "s3_plain"; - case ObjectStorageType::HDFS: - return "hdfs"; - case ObjectStorageType::Azure: - return "azure_blob_storage"; - case ObjectStorageType::Local: - return "local_blob_storage"; - case ObjectStorageType::Web: - return "web"; - case ObjectStorageType::None: - return "none"; - } - } - } - } + std::string toString() const; }; } diff --git a/src/Disks/ObjectStorages/IObjectStorage.h b/src/Disks/ObjectStorages/IObjectStorage.h index 56c269a3fc5..fde97d82ad1 100644 --- a/src/Disks/ObjectStorages/IObjectStorage.h +++ b/src/Disks/ObjectStorages/IObjectStorage.h @@ -218,6 +218,7 @@ public: virtual bool isReadOnly() const { return false; } virtual bool isWriteOnce() const { return false; } + virtual bool isPlain() const { return false; } virtual bool supportParallelWrite() const { return false; } diff --git a/src/Disks/ObjectStorages/MetadataStorageFactory.cpp b/src/Disks/ObjectStorages/MetadataStorageFactory.cpp index 52a0b9ec268..adc1f84372c 100644 
--- a/src/Disks/ObjectStorages/MetadataStorageFactory.cpp +++ b/src/Disks/ObjectStorages/MetadataStorageFactory.cpp @@ -32,6 +32,35 @@ void MetadataStorageFactory::registerMetadataStorageType(const std::string & met } } +std::string MetadataStorageFactory::getCompatibilityMetadataTypeHint(const ObjectStorageType & type) +{ + switch (type) + { + case ObjectStorageType::S3: + case ObjectStorageType::HDFS: + case ObjectStorageType::Local: + case ObjectStorageType::Azure: + return "local"; + case ObjectStorageType::Web: + return "web"; + default: + return ""; + } +} + +std::string MetadataStorageFactory::getMetadataType( + const Poco::Util::AbstractConfiguration & config, + const std::string & config_prefix, + const std::string & compatibility_type_hint) +{ + if (compatibility_type_hint.empty() && !config.has(config_prefix + ".metadata_type")) + { + throw Exception(ErrorCodes::NO_ELEMENTS_IN_CONFIG, "Expected `metadata_type` in config"); + } + + return config.getString(config_prefix + ".metadata_type", compatibility_type_hint); +} + MetadataStoragePtr MetadataStorageFactory::create( const std::string & name, const Poco::Util::AbstractConfiguration & config, @@ -39,12 +68,7 @@ MetadataStoragePtr MetadataStorageFactory::create( ObjectStoragePtr object_storage, const std::string & compatibility_type_hint) const { - if (compatibility_type_hint.empty() && !config.has(config_prefix + ".metadata_type")) - { - throw Exception(ErrorCodes::NO_ELEMENTS_IN_CONFIG, "Expected `metadata_type` in config"); - } - - const auto type = config.getString(config_prefix + ".metadata_type", compatibility_type_hint); + const auto type = getMetadataType(config, config_prefix, compatibility_type_hint); const auto it = registry.find(type); if (it == registry.end()) diff --git a/src/Disks/ObjectStorages/MetadataStorageFactory.h b/src/Disks/ObjectStorages/MetadataStorageFactory.h index 5f61125c599..467cd3cef98 100644 --- a/src/Disks/ObjectStorages/MetadataStorageFactory.h +++ b/src/Disks/ObjectStorages/MetadataStorageFactory.h @@ -25,6 +25,13 @@ public: ObjectStoragePtr object_storage, const std::string & compatibility_type_hint) const; + static std::string getMetadataType( + const Poco::Util::AbstractConfiguration & config, + const std::string & config_prefix, + const std::string & compatibility_type_hint = ""); + + static std::string getCompatibilityMetadataTypeHint(const ObjectStorageType & type); + private: using Registry = std::unordered_map; Registry registry; diff --git a/src/Disks/ObjectStorages/ObjectStorageFactory.cpp b/src/Disks/ObjectStorages/ObjectStorageFactory.cpp index b3626135177..6f6ff199902 100644 --- a/src/Disks/ObjectStorages/ObjectStorageFactory.cpp +++ b/src/Disks/ObjectStorages/ObjectStorageFactory.cpp @@ -16,8 +16,10 @@ #ifndef CLICKHOUSE_KEEPER_STANDALONE_BUILD #include #include +#include #include #endif +#include #include #include @@ -32,6 +34,28 @@ namespace ErrorCodes extern const int LOGICAL_ERROR; } +namespace +{ + template + ObjectStoragePtr createObjectStorage( + const Poco::Util::AbstractConfiguration & config, + const std::string & config_prefix, + Args && ...args) + { + auto compatibility_hint = MetadataStorageFactory::getCompatibilityMetadataTypeHint(ObjectStorageType::S3); + auto metadata_type = MetadataStorageFactory::getMetadataType(config, config_prefix, compatibility_hint); + + if (metadataTypeFromString(metadata_type) == MetadataStorageType::Plain) + { + return std::make_shared>(std::forward(args)...); + } + else + { + return std::make_shared(std::forward(args)...); + } + } +} + 
ObjectStorageFactory & ObjectStorageFactory::instance() { static ObjectStorageFactory factory; @@ -129,12 +153,12 @@ void registerS3ObjectStorage(ObjectStorageFactory & factory) auto client = getClient(config, config_prefix, context, *settings); auto key_generator = getKeyGenerator(disk_type, uri, config, config_prefix); - auto object_storage = std::make_shared( - std::move(client), std::move(settings), uri, s3_capabilities, key_generator, name); + auto object_storage = createObjectStorage( + config, config_prefix, std::move(client), std::move(settings), uri, s3_capabilities, key_generator, name); /// NOTE: should we still perform this check for clickhouse-disks? if (!skip_access_check) - checkS3Capabilities(*object_storage, s3_capabilities, name, uri.key); + checkS3Capabilities(*dynamic_cast(object_storage.get()), s3_capabilities, name, uri.key); return object_storage; }); @@ -165,12 +189,12 @@ void registerS3PlainObjectStorage(ObjectStorageFactory & factory) auto client = getClient(config, config_prefix, context, *settings); auto key_generator = getKeyGenerator(disk_type, uri, config, config_prefix); - auto object_storage = std::make_shared( + auto object_storage = std::make_shared>( std::move(client), std::move(settings), uri, s3_capabilities, key_generator, name); /// NOTE: should we still perform this check for clickhouse-disks? if (!skip_access_check) - checkS3Capabilities(*object_storage, s3_capabilities, name, uri.key); + checkS3Capabilities(*dynamic_cast(object_storage.get()), s3_capabilities, name, uri.key); return object_storage; }); @@ -198,7 +222,7 @@ void registerHDFSObjectStorage(ObjectStorageFactory & factory) context->getSettingsRef().hdfs_replication ); - return std::make_unique(uri, std::move(settings), config); + return createObjectStorage(config, config_prefix, uri, std::move(settings), config); }); } #endif @@ -214,7 +238,8 @@ void registerAzureObjectStorage(ObjectStorageFactory & factory) bool /* skip_access_check */) -> ObjectStoragePtr { String container_name = config.getString(config_prefix + ".container_name", "default-container"); - return std::make_unique( + return createObjectStorage( + config, config_prefix, name, getAzureBlobContainerClient(config, config_prefix), getAzureBlobStorageSettings(config, config_prefix, context), @@ -248,7 +273,7 @@ void registerWebObjectStorage(ObjectStorageFactory & factory) ErrorCodes::BAD_ARGUMENTS, "Bad URI: `{}`. Error: {}", uri, e.what()); } - return std::make_shared(uri, context); + return createObjectStorage(config, config_prefix, uri, context); }); } @@ -266,7 +291,7 @@ void registerLocalObjectStorage(ObjectStorageFactory & factory) loadDiskLocalConfig(name, config, config_prefix, context, object_key_prefix, keep_free_space_bytes); /// keys are mapped to the fs, object_key_prefix is a directory also fs::create_directories(object_key_prefix); - return std::make_shared(object_key_prefix); + return createObjectStorage(config, config_prefix, object_key_prefix); }); } #endif diff --git a/src/Disks/ObjectStorages/PlainObjectStorage.h b/src/Disks/ObjectStorages/PlainObjectStorage.h new file mode 100644 index 00000000000..3a81b85c44b --- /dev/null +++ b/src/Disks/ObjectStorages/PlainObjectStorage.h @@ -0,0 +1,29 @@ +#pragma once +#include + +namespace DB +{ + +/// Do not encode keys, store as-is, and do not require separate disk for metadata. +/// But because of this does not support renames/hardlinks/attrs/... +/// +/// NOTE: This disk has excessive API calls. 
+template +class PlainObjectStorage : public BaseObjectStorage +{ +public: + template + explicit PlainObjectStorage(Args && ...args) + : BaseObjectStorage(std::forward(args)...) {} + + std::string getName() const override { return "" + BaseObjectStorage::getName(); } + + /// Notes: + /// - supports BACKUP to this disk + /// - does not support INSERT into MergeTree table on this disk + bool isWriteOnce() const override { return true; } + + bool isPlain() const override { return true; } +}; + +} diff --git a/src/Disks/ObjectStorages/RegisterDiskObjectStorage.cpp b/src/Disks/ObjectStorages/RegisterDiskObjectStorage.cpp index 383a0b079b5..669a0102951 100644 --- a/src/Disks/ObjectStorages/RegisterDiskObjectStorage.cpp +++ b/src/Disks/ObjectStorages/RegisterDiskObjectStorage.cpp @@ -10,25 +10,6 @@ namespace DB void registerObjectStorages(); void registerMetadataStorages(); -static std::string getCompatibilityMetadataTypeHint(const ObjectStorageType & type) -{ - switch (type) - { - case ObjectStorageType::S3: - case ObjectStorageType::HDFS: - case ObjectStorageType::Local: - case ObjectStorageType::Azure: - return "local"; - case ObjectStorageType::S3_Plain: - return "plain"; - case ObjectStorageType::Web: - return "web"; - case ObjectStorageType::None: - return ""; - } - UNREACHABLE(); -} - void registerDiskObjectStorage(DiskFactory & factory, bool global_skip_access_check) { registerObjectStorages(); @@ -47,7 +28,10 @@ void registerDiskObjectStorage(DiskFactory & factory, bool global_skip_access_ch std::string compatibility_metadata_type_hint; if (!config.has(config_prefix + ".metadata_type")) { - compatibility_metadata_type_hint = getCompatibilityMetadataTypeHint(object_storage->getType()); + if (object_storage->isPlain()) + compatibility_metadata_type_hint = "plain"; + else + compatibility_metadata_type_hint = MetadataStorageFactory::getCompatibilityMetadataTypeHint(object_storage->getType()); } auto metadata_storage = MetadataStorageFactory::instance().create( diff --git a/src/Disks/ObjectStorages/S3/S3ObjectStorage.h b/src/Disks/ObjectStorages/S3/S3ObjectStorage.h index ab0fa5bed68..4ece98c5ec4 100644 --- a/src/Disks/ObjectStorages/S3/S3ObjectStorage.h +++ b/src/Disks/ObjectStorages/S3/S3ObjectStorage.h @@ -182,27 +182,6 @@ private: LoggerPtr log; }; -/// Do not encode keys, store as-is, and do not require separate disk for metadata. -/// But because of this does not support renames/hardlinks/attrs/... -/// -/// NOTE: This disk has excessive API calls. -class S3PlainObjectStorage : public S3ObjectStorage -{ -public: - std::string getName() const override { return "S3PlainObjectStorage"; } - - template - explicit S3PlainObjectStorage(Args && ...args) - : S3ObjectStorage("S3PlainObjectStorage", std::forward(args)...) {} - - ObjectStorageType getType() const override { return ObjectStorageType::S3_Plain; } - - /// Notes: - /// - supports BACKUP to this disk - /// - does not support INSERT into MergeTree table on this disk - bool isWriteOnce() const override { return true; } -}; - } #endif diff --git a/tests/integration/test_attach_backup_from_s3_plain/configs/disk_s3.xml b/tests/integration/test_attach_backup_from_s3_plain/configs/disk_s3.xml index 779e4b6ae21..3166eea7ccb 100644 --- a/tests/integration/test_attach_backup_from_s3_plain/configs/disk_s3.xml +++ b/tests/integration/test_attach_backup_from_s3_plain/configs/disk_s3.xml @@ -8,9 +8,16 @@ minio minio123 + + object_storage + local + plain + local_plain/ +
backup_disk_s3_plain + backup_disk_local_plain diff --git a/tests/integration/test_attach_backup_from_s3_plain/test.py b/tests/integration/test_attach_backup_from_s3_plain/test.py index e575c487b7a..4a8da1e6d66 100644 --- a/tests/integration/test_attach_backup_from_s3_plain/test.py +++ b/tests/integration/test_attach_backup_from_s3_plain/test.py @@ -20,17 +20,27 @@ def start_cluster(): finally: cluster.shutdown() +s3_disk_def = """disk(type=s3_plain, + endpoint='http://minio1:9001/root/data/disks/disk_s3_plain/{backup_name}/', + access_key_id='minio', + secret_access_key='minio123');""" + +local_disk_def = "disk(type=object_storage, object_storage_type = 'local', metadata_type = 'plain'" @pytest.mark.parametrize( - "table_name,backup_name,storage_policy,min_bytes_for_wide_part", + "table_name,backup_name,storage_policy,disk_def,min_bytes_for_wide_part", [ pytest.param( - "compact", "backup_compact", "s3_backup_compact", int(1e9), id="compact" + "compact", "backup_compact_s3", "backup_disk_s3_plain", s3_disk_def, int(1e9), id="compact" ), - pytest.param("wide", "backup_wide", "s3_backup_wide", int(0), id="wide"), + pytest.param("wide", "backup_wide_s3", "backup_disk_s3_plain", s3_disk_def, int(0), id="wide"), + pytest.param( + "compact", "backup_compact_local", "backup_disk_local_plain", local_disk_def, int(1e9), id="compact" + ), + pytest.param("wide", "backup_wide_local", "backup_disk_local_plain", local_disk_def, int(0), id="wide"), ], ) -def test_attach_part(table_name, backup_name, storage_policy, min_bytes_for_wide_part): +def test_attach_part(table_name, backup_name, storage_policy, disk_def, min_bytes_for_wide_part): node.query( f""" -- Catch any errors (NOTE: warnings are ok) @@ -45,7 +55,7 @@ def test_attach_part(table_name, backup_name, storage_policy, min_bytes_for_wide settings min_bytes_for_wide_part={min_bytes_for_wide_part} as select number%5 part, number key from numbers(100); - backup table ordinary_db.{table_name} TO Disk('backup_disk_s3_plain', '{backup_name}') settings deduplicate_files=0; + backup table ordinary_db.{table_name} TO Disk('{storage_policy}', '{backup_name}') settings deduplicate_files=0; drop table ordinary_db.{table_name}; attach table ordinary_db.{table_name} (part UInt8, key UInt64) @@ -53,10 +63,7 @@ def test_attach_part(table_name, backup_name, storage_policy, min_bytes_for_wide order by key partition by part settings max_suspicious_broken_parts=0, - disk=disk(type=s3_plain, - endpoint='http://minio1:9001/root/data/disks/disk_s3_plain/{backup_name}/', - access_key_id='minio', - secret_access_key='minio123'); + disk={disk_def} """ ) From 69b5bd02a915ae044b4116de759d11ae80525dc5 Mon Sep 17 00:00:00 2001 From: robot-clickhouse Date: Mon, 26 Feb 2024 09:37:17 +0000 Subject: [PATCH 058/985] Automatic style fix --- .../test_attach_backup_from_s3_plain/test.py | 42 ++++++++++++++++--- 1 file changed, 36 insertions(+), 6 deletions(-) diff --git a/tests/integration/test_attach_backup_from_s3_plain/test.py b/tests/integration/test_attach_backup_from_s3_plain/test.py index 4a8da1e6d66..900366b2c9c 100644 --- a/tests/integration/test_attach_backup_from_s3_plain/test.py +++ b/tests/integration/test_attach_backup_from_s3_plain/test.py @@ -20,27 +20,57 @@ def start_cluster(): finally: cluster.shutdown() + s3_disk_def = """disk(type=s3_plain, endpoint='http://minio1:9001/root/data/disks/disk_s3_plain/{backup_name}/', access_key_id='minio', secret_access_key='minio123');""" -local_disk_def = "disk(type=object_storage, object_storage_type = 'local', metadata_type = 
'plain'" +local_disk_def = ( + "disk(type=object_storage, object_storage_type = 'local', metadata_type = 'plain'" +) + @pytest.mark.parametrize( "table_name,backup_name,storage_policy,disk_def,min_bytes_for_wide_part", [ pytest.param( - "compact", "backup_compact_s3", "backup_disk_s3_plain", s3_disk_def, int(1e9), id="compact" + "compact", + "backup_compact_s3", + "backup_disk_s3_plain", + s3_disk_def, + int(1e9), + id="compact", ), - pytest.param("wide", "backup_wide_s3", "backup_disk_s3_plain", s3_disk_def, int(0), id="wide"), pytest.param( - "compact", "backup_compact_local", "backup_disk_local_plain", local_disk_def, int(1e9), id="compact" + "wide", + "backup_wide_s3", + "backup_disk_s3_plain", + s3_disk_def, + int(0), + id="wide", + ), + pytest.param( + "compact", + "backup_compact_local", + "backup_disk_local_plain", + local_disk_def, + int(1e9), + id="compact", + ), + pytest.param( + "wide", + "backup_wide_local", + "backup_disk_local_plain", + local_disk_def, + int(0), + id="wide", ), - pytest.param("wide", "backup_wide_local", "backup_disk_local_plain", local_disk_def, int(0), id="wide"), ], ) -def test_attach_part(table_name, backup_name, storage_policy, disk_def, min_bytes_for_wide_part): +def test_attach_part( + table_name, backup_name, storage_policy, disk_def, min_bytes_for_wide_part +): node.query( f""" -- Catch any errors (NOTE: warnings are ok) From ac4af6a4ad3b67860eae79b2ed3320fc5981a954 Mon Sep 17 00:00:00 2001 From: avogar Date: Mon, 26 Feb 2024 19:58:49 +0000 Subject: [PATCH 059/985] Don't allow to set max_parallel_replicas to 0 as it doesn't make sense --- src/Client/ConnectionPoolWithFailover.cpp | 9 +++++++++ src/Client/HedgedConnectionsFactory.cpp | 3 +++ src/Client/HedgedConnectionsFactory.h | 2 +- src/Interpreters/InterpreterSelectQuery.cpp | 4 ++-- src/Planner/PlannerJoinTree.cpp | 4 ++-- .../03001_max_parallel_replicas_zero_value.reference | 0 .../03001_max_parallel_replicas_zero_value.sql | 5 +++++ 7 files changed, 22 insertions(+), 5 deletions(-) create mode 100644 tests/queries/0_stateless/03001_max_parallel_replicas_zero_value.reference create mode 100644 tests/queries/0_stateless/03001_max_parallel_replicas_zero_value.sql diff --git a/src/Client/ConnectionPoolWithFailover.cpp b/src/Client/ConnectionPoolWithFailover.cpp index 492fd4ae9e2..46b9741c812 100644 --- a/src/Client/ConnectionPoolWithFailover.cpp +++ b/src/Client/ConnectionPoolWithFailover.cpp @@ -191,11 +191,20 @@ std::vector ConnectionPoolWithFailover::g max_entries = nested_pools.size(); } else if (pool_mode == PoolMode::GET_ONE) + { max_entries = 1; + } else if (pool_mode == PoolMode::GET_MANY) + { + if (settings.max_parallel_replicas == 0) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "The value of the setting max_parallel_replicas must be greater than 0"); + max_entries = settings.max_parallel_replicas; + } else + { throw DB::Exception(DB::ErrorCodes::LOGICAL_ERROR, "Unknown pool allocation mode"); + } if (!priority_func) priority_func = makeGetPriorityFunc(settings); diff --git a/src/Client/HedgedConnectionsFactory.cpp b/src/Client/HedgedConnectionsFactory.cpp index f5b074a0257..a4e5dbf04ac 100644 --- a/src/Client/HedgedConnectionsFactory.cpp +++ b/src/Client/HedgedConnectionsFactory.cpp @@ -82,6 +82,9 @@ std::vector HedgedConnectionsFactory::getManyConnections(PoolMode } case PoolMode::GET_MANY: { + if (max_parallel_replicas == 0) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "The value of the setting max_parallel_replicas must be greater than 0"); + max_entries = max_parallel_replicas; 
break; } diff --git a/src/Client/HedgedConnectionsFactory.h b/src/Client/HedgedConnectionsFactory.h index ce7b553acdd..dd600d58e1e 100644 --- a/src/Client/HedgedConnectionsFactory.h +++ b/src/Client/HedgedConnectionsFactory.h @@ -158,7 +158,7 @@ private: /// checking the number of requested replicas that are still in process). size_t requested_connections_count = 0; - const size_t max_parallel_replicas = 0; + const size_t max_parallel_replicas = 1; const bool skip_unavailable_shards = 0; }; diff --git a/src/Interpreters/InterpreterSelectQuery.cpp b/src/Interpreters/InterpreterSelectQuery.cpp index d34294b4c4b..fe5e5dc69d1 100644 --- a/src/Interpreters/InterpreterSelectQuery.cpp +++ b/src/Interpreters/InterpreterSelectQuery.cpp @@ -871,7 +871,7 @@ bool InterpreterSelectQuery::adjustParallelReplicasAfterAnalysis() { /// The query could use trivial count if it didn't use parallel replicas, so let's disable it and reanalyze context->setSetting("allow_experimental_parallel_reading_from_replicas", Field(0)); - context->setSetting("max_parallel_replicas", UInt64{0}); + context->setSetting("max_parallel_replicas", UInt64{1}); LOG_DEBUG(log, "Disabling parallel replicas to be able to use a trivial count optimization"); return true; } @@ -909,7 +909,7 @@ bool InterpreterSelectQuery::adjustParallelReplicasAfterAnalysis() if (number_of_replicas_to_use <= 1) { context->setSetting("allow_experimental_parallel_reading_from_replicas", Field(0)); - context->setSetting("max_parallel_replicas", UInt64{0}); + context->setSetting("max_parallel_replicas", UInt64{1}); LOG_DEBUG(log, "Disabling parallel replicas because there aren't enough rows to read"); return true; } diff --git a/src/Planner/PlannerJoinTree.cpp b/src/Planner/PlannerJoinTree.cpp index e6a459d0e8a..2b1cd7fb353 100644 --- a/src/Planner/PlannerJoinTree.cpp +++ b/src/Planner/PlannerJoinTree.cpp @@ -295,7 +295,7 @@ bool applyTrivialCountIfPossible( /// The query could use trivial count if it didn't use parallel replicas, so let's disable it query_context->setSetting("allow_experimental_parallel_reading_from_replicas", Field(0)); - query_context->setSetting("max_parallel_replicas", UInt64{0}); + query_context->setSetting("max_parallel_replicas", UInt64{1}); LOG_TRACE(getLogger("Planner"), "Disabling parallel replicas to be able to use a trivial count optimization"); } @@ -756,7 +756,7 @@ JoinTreeQueryPlan buildQueryPlanForTableExpression(QueryTreeNodePtr table_expres { planner_context->getMutableQueryContext()->setSetting( "allow_experimental_parallel_reading_from_replicas", Field(0)); - planner_context->getMutableQueryContext()->setSetting("max_parallel_replicas", UInt64{0}); + planner_context->getMutableQueryContext()->setSetting("max_parallel_replicas", UInt64{1}); LOG_DEBUG(getLogger("Planner"), "Disabling parallel replicas because there aren't enough rows to read"); } else if (number_of_replicas_to_use < settings.max_parallel_replicas) diff --git a/tests/queries/0_stateless/03001_max_parallel_replicas_zero_value.reference b/tests/queries/0_stateless/03001_max_parallel_replicas_zero_value.reference new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/queries/0_stateless/03001_max_parallel_replicas_zero_value.sql b/tests/queries/0_stateless/03001_max_parallel_replicas_zero_value.sql new file mode 100644 index 00000000000..611aa4777ba --- /dev/null +++ b/tests/queries/0_stateless/03001_max_parallel_replicas_zero_value.sql @@ -0,0 +1,5 @@ +drop table if exists test_d; +create table test_d 
engine=Distributed(test_cluster_two_shard_three_replicas_localhost, system, numbers); +select * from test_d limit 10 settings max_parallel_replicas = 0, prefer_localhost_replica = 0; --{serverError BAD_ARGUMENTS} +drop table test_d; + From 8aa9f36484bbe814a1e3edccc608e71b73915857 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Mon, 26 Feb 2024 22:05:54 +0100 Subject: [PATCH 060/985] Fix style --- src/Client/ConnectionPoolWithFailover.cpp | 1 + 1 file changed, 1 insertion(+) diff --git a/src/Client/ConnectionPoolWithFailover.cpp b/src/Client/ConnectionPoolWithFailover.cpp index 46b9741c812..ad8ed0067d8 100644 --- a/src/Client/ConnectionPoolWithFailover.cpp +++ b/src/Client/ConnectionPoolWithFailover.cpp @@ -21,6 +21,7 @@ namespace ErrorCodes { extern const int LOGICAL_ERROR; extern const int ALL_CONNECTION_TRIES_FAILED; + extern const int BAD_ARGUMENTS; } From f264f0a0360baf1413ec38d3f3f30c70595064f4 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Mon, 26 Feb 2024 22:06:10 +0100 Subject: [PATCH 061/985] Fix style --- src/Client/HedgedConnectionsFactory.cpp | 1 + 1 file changed, 1 insertion(+) diff --git a/src/Client/HedgedConnectionsFactory.cpp b/src/Client/HedgedConnectionsFactory.cpp index a4e5dbf04ac..16a03a696bd 100644 --- a/src/Client/HedgedConnectionsFactory.cpp +++ b/src/Client/HedgedConnectionsFactory.cpp @@ -19,6 +19,7 @@ namespace ErrorCodes extern const int ALL_CONNECTION_TRIES_FAILED; extern const int ALL_REPLICAS_ARE_STALE; extern const int LOGICAL_ERROR; + extern const int BAD_ARGUMENTS; } HedgedConnectionsFactory::HedgedConnectionsFactory( From f53f43b78d3cf2da6219ea4bdea7018d9811ae54 Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 27 Feb 2024 17:33:47 +0800 Subject: [PATCH 062/985] Fixes for LocalObjectStorage and plain metadata --- .../Local/LocalObjectStorage.cpp | 37 +++++++++++++++++-- .../ObjectStorages/Local/LocalObjectStorage.h | 4 ++ .../MetadataStorageFromPlainObjectStorage.cpp | 5 +-- .../ObjectStorages/ObjectStorageFactory.cpp | 31 ++++++++++------ src/Disks/ObjectStorages/PlainObjectStorage.h | 6 +++ src/Disks/ObjectStorages/S3/DiskS3Utils.cpp | 6 --- src/Disks/ObjectStorages/S3/DiskS3Utils.h | 1 - .../ObjectStorages/S3/S3ObjectStorage.cpp | 2 + .../configs/disk_s3.xml | 4 +- .../test_attach_backup_from_s3_plain/test.py | 7 ++-- 10 files changed, 71 insertions(+), 32 deletions(-) diff --git a/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp b/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp index 02700b358e0..51c260cc270 100644 --- a/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp +++ b/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp @@ -31,6 +31,8 @@ LocalObjectStorage::LocalObjectStorage(String key_prefix_) description = *block_device_id; else description = "/"; + + fs::create_directories(getCommonKeyPrefix()); } bool LocalObjectStorage::exists(const StoredObject & object) const @@ -53,6 +55,7 @@ std::unique_ptr LocalObjectStorage::readObjects( /// NOL return createReadBufferFromFileBase(file_path, modified_settings, read_hint, file_size); }; + LOG_TEST(log, "Read object: {}", objects[0].remote_path); switch (read_settings.remote_fs_method) { case RemoteFSReadMethod::read: @@ -111,8 +114,8 @@ std::unique_ptr LocalObjectStorage::readObject( /// NOLI if (!file_size) file_size = tryGetSizeFromFilePath(path); - LOG_TEST(log, "Read object: {}", path); - return createReadBufferFromFileBase(path, patchSettings(read_settings), read_hint, file_size); + 
LOG_TEST(log, "Read object: {}", object.remote_path); + return createReadBufferFromFileBase(object.remote_path, patchSettings(read_settings), read_hint, file_size); } std::unique_ptr LocalObjectStorage::writeObject( /// NOLINT @@ -126,6 +129,7 @@ std::unique_ptr LocalObjectStorage::writeObject( /// NO throw Exception(ErrorCodes::BAD_ARGUMENTS, "LocalObjectStorage doesn't support append to files"); LOG_TEST(log, "Write object: {}", object.remote_path); + fs::create_directories(fs::path(object.remote_path).parent_path()); return std::make_unique(object.remote_path, buf_size); } @@ -157,9 +161,34 @@ void LocalObjectStorage::removeObjectsIfExist(const StoredObjects & objects) removeObjectIfExists(object); } -ObjectMetadata LocalObjectStorage::getObjectMetadata(const std::string & /* path */) const +ObjectMetadata LocalObjectStorage::getObjectMetadata(const std::string & path) const { - throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Metadata is not supported for LocalObjectStorage"); + ObjectMetadata object_metadata; + LOG_TEST(log, "Getting metadata for path: {}", path); + object_metadata.size_bytes = fs::file_size(path); + object_metadata.last_modified = Poco::Timestamp::fromEpochTime( + std::chrono::duration_cast(fs::last_write_time(path).time_since_epoch()).count()); + return object_metadata; +} + +void LocalObjectStorage::listObjects(const std::string & path, RelativePathsWithMetadata & children, int /* max_keys */) const +{ + for (const auto & entry : fs::directory_iterator(path)) + { + if (entry.is_directory()) + { + listObjects(entry.path(), children, 0); + continue; + } + + auto metadata = getObjectMetadata(entry.path()); + children.emplace_back(entry.path(), std::move(metadata)); + } +} + +bool LocalObjectStorage::existsOrHasAnyChild(const std::string & path) const +{ + return exists(StoredObject(path)); } void LocalObjectStorage::copyObject( // NOLINT diff --git a/src/Disks/ObjectStorages/Local/LocalObjectStorage.h b/src/Disks/ObjectStorages/Local/LocalObjectStorage.h index ed5f8c1f537..22429a99c76 100644 --- a/src/Disks/ObjectStorages/Local/LocalObjectStorage.h +++ b/src/Disks/ObjectStorages/Local/LocalObjectStorage.h @@ -58,6 +58,10 @@ public: ObjectMetadata getObjectMetadata(const std::string & path) const override; + void listObjects(const std::string & path, RelativePathsWithMetadata & children, int max_keys) const override; + + bool existsOrHasAnyChild(const std::string & path) const override; + void copyObject( /// NOLINT const StoredObject & object_from, const StoredObject & object_to, diff --git a/src/Disks/ObjectStorages/MetadataStorageFromPlainObjectStorage.cpp b/src/Disks/ObjectStorages/MetadataStorageFromPlainObjectStorage.cpp index b03809f5b39..4b8fc74e956 100644 --- a/src/Disks/ObjectStorages/MetadataStorageFromPlainObjectStorage.cpp +++ b/src/Disks/ObjectStorages/MetadataStorageFromPlainObjectStorage.cpp @@ -48,10 +48,7 @@ bool MetadataStorageFromPlainObjectStorage::isDirectory(const std::string & path std::string directory = object_key.serialize(); if (!directory.ends_with('/')) directory += '/'; - - RelativePathsWithMetadata files; - object_storage->listObjects(directory, files, 1); - return !files.empty(); + return object_storage->existsOrHasAnyChild(directory); } uint64_t MetadataStorageFromPlainObjectStorage::getFileSize(const String & path) const diff --git a/src/Disks/ObjectStorages/ObjectStorageFactory.cpp b/src/Disks/ObjectStorages/ObjectStorageFactory.cpp index 6f6ff199902..f64c42c1403 100644 --- a/src/Disks/ObjectStorages/ObjectStorageFactory.cpp +++ 
b/src/Disks/ObjectStorages/ObjectStorageFactory.cpp @@ -36,16 +36,24 @@ namespace ErrorCodes namespace { + bool isPlainStorage( + ObjectStorageType type, + const Poco::Util::AbstractConfiguration & config, + const std::string & config_prefix) + { + auto compatibility_hint = MetadataStorageFactory::getCompatibilityMetadataTypeHint(type); + auto metadata_type = MetadataStorageFactory::getMetadataType(config, config_prefix, compatibility_hint); + return metadataTypeFromString(metadata_type) == MetadataStorageType::Plain; + } + template ObjectStoragePtr createObjectStorage( + ObjectStorageType type, const Poco::Util::AbstractConfiguration & config, const std::string & config_prefix, Args && ...args) { - auto compatibility_hint = MetadataStorageFactory::getCompatibilityMetadataTypeHint(ObjectStorageType::S3); - auto metadata_type = MetadataStorageFactory::getMetadataType(config, config_prefix, compatibility_hint); - - if (metadataTypeFromString(metadata_type) == MetadataStorageType::Plain) + if (isPlainStorage(type, config, config_prefix)) { return std::make_shared>(std::forward(args)...); } @@ -151,10 +159,10 @@ void registerS3ObjectStorage(ObjectStorageFactory & factory) auto s3_capabilities = getCapabilitiesFromConfig(config, config_prefix); auto settings = getSettings(config, config_prefix, context); auto client = getClient(config, config_prefix, context, *settings); - auto key_generator = getKeyGenerator(disk_type, uri, config, config_prefix); + auto key_generator = getKeyGenerator(uri, config, config_prefix); auto object_storage = createObjectStorage( - config, config_prefix, std::move(client), std::move(settings), uri, s3_capabilities, key_generator, name); + ObjectStorageType::S3, config, config_prefix, std::move(client), std::move(settings), uri, s3_capabilities, key_generator, name); /// NOTE: should we still perform this check for clickhouse-disks? if (!skip_access_check) @@ -187,7 +195,7 @@ void registerS3PlainObjectStorage(ObjectStorageFactory & factory) auto s3_capabilities = getCapabilitiesFromConfig(config, config_prefix); auto settings = getSettings(config, config_prefix, context); auto client = getClient(config, config_prefix, context, *settings); - auto key_generator = getKeyGenerator(disk_type, uri, config, config_prefix); + auto key_generator = getKeyGenerator(uri, config, config_prefix); auto object_storage = std::make_shared>( std::move(client), std::move(settings), uri, s3_capabilities, key_generator, name); @@ -222,7 +230,7 @@ void registerHDFSObjectStorage(ObjectStorageFactory & factory) context->getSettingsRef().hdfs_replication ); - return createObjectStorage(config, config_prefix, uri, std::move(settings), config); + return createObjectStorage(ObjectStorageType::HDFS, config, config_prefix, uri, std::move(settings), config); }); } #endif @@ -239,8 +247,7 @@ void registerAzureObjectStorage(ObjectStorageFactory & factory) { String container_name = config.getString(config_prefix + ".container_name", "default-container"); return createObjectStorage( - config, config_prefix, - name, + ObjectStorageType::Azure, config, config_prefix, name, getAzureBlobContainerClient(config, config_prefix), getAzureBlobStorageSettings(config, config_prefix, context), container_name); @@ -273,7 +280,7 @@ void registerWebObjectStorage(ObjectStorageFactory & factory) ErrorCodes::BAD_ARGUMENTS, "Bad URI: `{}`. 
Error: {}", uri, e.what()); } - return createObjectStorage(config, config_prefix, uri, context); + return createObjectStorage(ObjectStorageType::Web, config, config_prefix, uri, context); }); } @@ -291,7 +298,7 @@ void registerLocalObjectStorage(ObjectStorageFactory & factory) loadDiskLocalConfig(name, config, config_prefix, context, object_key_prefix, keep_free_space_bytes); /// keys are mapped to the fs, object_key_prefix is a directory also fs::create_directories(object_key_prefix); - return createObjectStorage(config, config_prefix, object_key_prefix); + return createObjectStorage(ObjectStorageType::Local, config, config_prefix, object_key_prefix); }); } #endif diff --git a/src/Disks/ObjectStorages/PlainObjectStorage.h b/src/Disks/ObjectStorages/PlainObjectStorage.h index 3a81b85c44b..e0907d0b4d8 100644 --- a/src/Disks/ObjectStorages/PlainObjectStorage.h +++ b/src/Disks/ObjectStorages/PlainObjectStorage.h @@ -1,5 +1,6 @@ #pragma once #include +#include namespace DB { @@ -24,6 +25,11 @@ public: bool isWriteOnce() const override { return true; } bool isPlain() const override { return true; } + + ObjectStorageKey generateObjectKeyForPath(const std::string & path) const override + { + return ObjectStorageKey::createAsRelative(BaseObjectStorage::getCommonKeyPrefix(), path); + } }; } diff --git a/src/Disks/ObjectStorages/S3/DiskS3Utils.cpp b/src/Disks/ObjectStorages/S3/DiskS3Utils.cpp index bb7b53b2d22..4b889f89f90 100644 --- a/src/Disks/ObjectStorages/S3/DiskS3Utils.cpp +++ b/src/Disks/ObjectStorages/S3/DiskS3Utils.cpp @@ -15,16 +15,10 @@ namespace ErrorCodes } ObjectStorageKeysGeneratorPtr getKeyGenerator( - String type, const S3::URI & uri, const Poco::Util::AbstractConfiguration & config, const String & config_prefix) { - if (type == "s3_plain") - return createObjectStorageKeysGeneratorAsIsWithPrefix(uri.key); - - chassert(type == "s3"); - bool storage_metadata_write_full_object_key = DiskObjectStorageMetadata::getWriteFullObjectKeySetting(); bool send_metadata = config.getBool(config_prefix + ".send_metadata", false); diff --git a/src/Disks/ObjectStorages/S3/DiskS3Utils.h b/src/Disks/ObjectStorages/S3/DiskS3Utils.h index 29e39d4bc1b..8524a9ccac3 100644 --- a/src/Disks/ObjectStorages/S3/DiskS3Utils.h +++ b/src/Disks/ObjectStorages/S3/DiskS3Utils.h @@ -12,7 +12,6 @@ namespace DB namespace S3 { struct URI; } ObjectStorageKeysGeneratorPtr getKeyGenerator( - String type, const S3::URI & uri, const Poco::Util::AbstractConfiguration & config, const String & config_prefix); diff --git a/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp b/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp index 5771eb1ebe0..b2a9ab8fdc3 100644 --- a/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp +++ b/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp @@ -561,6 +561,8 @@ std::unique_ptr S3ObjectStorage::cloneObjectStorage( ObjectStorageKey S3ObjectStorage::generateObjectKeyForPath(const std::string & path) const { + if (!key_generator) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Key generator is not set"); return key_generator->generate(path); } diff --git a/tests/integration/test_attach_backup_from_s3_plain/configs/disk_s3.xml b/tests/integration/test_attach_backup_from_s3_plain/configs/disk_s3.xml index 3166eea7ccb..2edabc76c8b 100644 --- a/tests/integration/test_attach_backup_from_s3_plain/configs/disk_s3.xml +++ b/tests/integration/test_attach_backup_from_s3_plain/configs/disk_s3.xml @@ -10,9 +10,9 @@ object_storage - local + local_blob_storage plain - local_plain/ + /local_plain/ diff --git 
a/tests/integration/test_attach_backup_from_s3_plain/test.py b/tests/integration/test_attach_backup_from_s3_plain/test.py index 4a8da1e6d66..983275cc24f 100644 --- a/tests/integration/test_attach_backup_from_s3_plain/test.py +++ b/tests/integration/test_attach_backup_from_s3_plain/test.py @@ -21,11 +21,11 @@ def start_cluster(): cluster.shutdown() s3_disk_def = """disk(type=s3_plain, - endpoint='http://minio1:9001/root/data/disks/disk_s3_plain/{backup_name}/', + endpoint='http://minio1:9001/root/data/disks/disk_s3_plain/{}/', access_key_id='minio', secret_access_key='minio123');""" -local_disk_def = "disk(type=object_storage, object_storage_type = 'local', metadata_type = 'plain'" +local_disk_def = "disk(type=object_storage, object_storage_type = 'local_blob_storage', metadata_type = 'plain', path = '/local_plain/{}/')" @pytest.mark.parametrize( "table_name,backup_name,storage_policy,disk_def,min_bytes_for_wide_part", @@ -41,6 +41,7 @@ local_disk_def = "disk(type=object_storage, object_storage_type = 'local', metad ], ) def test_attach_part(table_name, backup_name, storage_policy, disk_def, min_bytes_for_wide_part): + disk_definition = disk_def.format(backup_name) node.query( f""" -- Catch any errors (NOTE: warnings are ok) @@ -63,7 +64,7 @@ def test_attach_part(table_name, backup_name, storage_policy, disk_def, min_byte order by key partition by part settings max_suspicious_broken_parts=0, - disk={disk_def} + disk={disk_definition} """ ) From fb38bd139c433ead685028f232e8c4fad5e566d2 Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 27 Feb 2024 17:38:02 +0800 Subject: [PATCH 063/985] Remove debug logging --- src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp | 5 +---- 1 file changed, 1 insertion(+), 4 deletions(-) diff --git a/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp b/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp index 51c260cc270..4ec998a2bb0 100644 --- a/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp +++ b/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp @@ -55,7 +55,6 @@ std::unique_ptr LocalObjectStorage::readObjects( /// NOL return createReadBufferFromFileBase(file_path, modified_settings, read_hint, file_size); }; - LOG_TEST(log, "Read object: {}", objects[0].remote_path); switch (read_settings.remote_fs_method) { case RemoteFSReadMethod::read: @@ -109,10 +108,8 @@ std::unique_ptr LocalObjectStorage::readObject( /// NOLI std::optional read_hint, std::optional file_size) const { - const auto & path = object.remote_path; - if (!file_size) - file_size = tryGetSizeFromFilePath(path); + file_size = tryGetSizeFromFilePath(object.remote_path); LOG_TEST(log, "Read object: {}", object.remote_path); return createReadBufferFromFileBase(object.remote_path, patchSettings(read_settings), read_hint, file_size); From 978fe9fa1a069a231bb52c66b3898c6ce112a215 Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 27 Feb 2024 17:43:34 +0800 Subject: [PATCH 064/985] Add comments --- src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp b/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp index 4ec998a2bb0..7f34ca48f7f 100644 --- a/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp +++ b/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp @@ -126,7 +126,11 @@ std::unique_ptr LocalObjectStorage::writeObject( /// NO throw Exception(ErrorCodes::BAD_ARGUMENTS, "LocalObjectStorage doesn't support append to files"); LOG_TEST(log, "Write object: {}", 
object.remote_path); + + /// Unlike real blob storage, in local fs we cannot create a file with non-existing prefix. + /// So let's create it. fs::create_directories(fs::path(object.remote_path).parent_path()); + return std::make_unique(object.remote_path, buf_size); } @@ -185,6 +189,8 @@ void LocalObjectStorage::listObjects(const std::string & path, RelativePathsWith bool LocalObjectStorage::existsOrHasAnyChild(const std::string & path) const { + /// Unlike real object storage, existance of a prefix path can be checked by + /// just checking existence of this prefix directly, so simple exists is enough here. return exists(StoredObject(path)); } From 33788250b1f74384661cd241e2badef82c8fdbf6 Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 27 Feb 2024 18:07:19 +0800 Subject: [PATCH 065/985] Update test.py --- tests/integration/test_attach_backup_from_s3_plain/test.py | 6 ++---- 1 file changed, 2 insertions(+), 4 deletions(-) diff --git a/tests/integration/test_attach_backup_from_s3_plain/test.py b/tests/integration/test_attach_backup_from_s3_plain/test.py index 3a0fa70a715..c2f8936b82c 100644 --- a/tests/integration/test_attach_backup_from_s3_plain/test.py +++ b/tests/integration/test_attach_backup_from_s3_plain/test.py @@ -26,9 +26,8 @@ s3_disk_def = """disk(type=s3_plain, access_key_id='minio', secret_access_key='minio123');""" -local_disk_def = ( - "disk(type=object_storage, object_storage_type = 'local', metadata_type = 'plain', path = '/local_plain/{}/'" -) +local_disk_def = "disk(type=object_storage, object_storage_type = 'local_blob_storage', metadata_type = 'plain', path = '/local_plain/{}/');" + @pytest.mark.parametrize( "table_name,backup_name,storage_policy,disk_def,min_bytes_for_wide_part", @@ -67,7 +66,6 @@ local_disk_def = ( ), ], ) - def test_attach_part( table_name, backup_name, storage_policy, disk_def, min_bytes_for_wide_part ): From 58a53b42acb3b25a41e8529186db9df0d4387f77 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Tue, 27 Feb 2024 14:31:35 +0100 Subject: [PATCH 066/985] Set max_entries to min(max_parallel_replicas, all available replicas) --- src/Client/HedgedConnectionsFactory.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Client/HedgedConnectionsFactory.cpp b/src/Client/HedgedConnectionsFactory.cpp index 16a03a696bd..703cc1f8821 100644 --- a/src/Client/HedgedConnectionsFactory.cpp +++ b/src/Client/HedgedConnectionsFactory.cpp @@ -86,7 +86,7 @@ std::vector HedgedConnectionsFactory::getManyConnections(PoolMode if (max_parallel_replicas == 0) throw Exception(ErrorCodes::BAD_ARGUMENTS, "The value of the setting max_parallel_replicas must be greater than 0"); - max_entries = max_parallel_replicas; + max_entries = std::min(max_parallel_replicas, shuffled_pools.size()); break; } } From 98b27fd45fbe1109442c2313181ca4e8435e2024 Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 27 Feb 2024 23:00:27 +0800 Subject: [PATCH 067/985] Fix style check --- src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp | 2 +- src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp | 1 + 2 files changed, 2 insertions(+), 1 deletion(-) diff --git a/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp b/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp index 7f34ca48f7f..eba57969580 100644 --- a/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp +++ b/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp @@ -189,7 +189,7 @@ void LocalObjectStorage::listObjects(const std::string & path, RelativePathsWith bool 
LocalObjectStorage::existsOrHasAnyChild(const std::string & path) const { - /// Unlike real object storage, existance of a prefix path can be checked by + /// Unlike real object storage, existence of a prefix path can be checked by /// just checking existence of this prefix directly, so simple exists is enough here. return exists(StoredObject(path)); } diff --git a/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp b/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp index b2a9ab8fdc3..eec3a5914fc 100644 --- a/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp +++ b/src/Disks/ObjectStorages/S3/S3ObjectStorage.cpp @@ -48,6 +48,7 @@ namespace ErrorCodes { extern const int S3_ERROR; extern const int BAD_ARGUMENTS; + extern const int LOGICAL_ERROR; } namespace From 416638461fe832673252445d8fabb3fe554eed49 Mon Sep 17 00:00:00 2001 From: avogar Date: Tue, 27 Feb 2024 15:02:13 +0000 Subject: [PATCH 068/985] Try to fix logical error 'Cannot capture column because it has incompatible type' in mapContainsKeyLike --- src/Functions/array/FunctionArrayMapped.h | 4 ++-- .../03002_map_array_functions_with_low_cardinality.reference | 1 + .../03002_map_array_functions_with_low_cardinality.sql | 2 ++ 3 files changed, 5 insertions(+), 2 deletions(-) create mode 100644 tests/queries/0_stateless/03002_map_array_functions_with_low_cardinality.reference create mode 100644 tests/queries/0_stateless/03002_map_array_functions_with_low_cardinality.sql diff --git a/src/Functions/array/FunctionArrayMapped.h b/src/Functions/array/FunctionArrayMapped.h index 49ed9d495e2..136d3481771 100644 --- a/src/Functions/array/FunctionArrayMapped.h +++ b/src/Functions/array/FunctionArrayMapped.h @@ -355,7 +355,7 @@ public: { arrays.emplace_back( column_tuple->getColumnPtr(j), - recursiveRemoveLowCardinality(type_tuple.getElement(j)), + type_tuple.getElement(j), array_with_type_and_name.name + "." 
+ tuple_names[j]); } } @@ -363,7 +363,7 @@ public: { arrays.emplace_back( column_array->getDataPtr(), - recursiveRemoveLowCardinality(array_type->getNestedType()), + array_type->getNestedType(), array_with_type_and_name.name); } diff --git a/tests/queries/0_stateless/03002_map_array_functions_with_low_cardinality.reference b/tests/queries/0_stateless/03002_map_array_functions_with_low_cardinality.reference new file mode 100644 index 00000000000..d00491fd7e5 --- /dev/null +++ b/tests/queries/0_stateless/03002_map_array_functions_with_low_cardinality.reference @@ -0,0 +1 @@ +1 diff --git a/tests/queries/0_stateless/03002_map_array_functions_with_low_cardinality.sql b/tests/queries/0_stateless/03002_map_array_functions_with_low_cardinality.sql new file mode 100644 index 00000000000..8240a8f93f5 --- /dev/null +++ b/tests/queries/0_stateless/03002_map_array_functions_with_low_cardinality.sql @@ -0,0 +1,2 @@ +SELECT mapContainsKeyLike(map('aa', toLowCardinality(1), 'bb', toLowCardinality(2)), toLowCardinality('a%')); + From 5771e739f0e65baae69f1e7abd42495d5fbc5488 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Tue, 27 Feb 2024 23:11:29 +0800 Subject: [PATCH 069/985] Update ReadSettings.h --- src/IO/ReadSettings.h | 1 - 1 file changed, 1 deletion(-) diff --git a/src/IO/ReadSettings.h b/src/IO/ReadSettings.h index 2c79735317d..846fcd668f0 100644 --- a/src/IO/ReadSettings.h +++ b/src/IO/ReadSettings.h @@ -98,7 +98,6 @@ struct ReadSettings bool enable_filesystem_cache = true; bool read_from_filesystem_cache_if_exists_otherwise_bypass_cache = false; bool enable_filesystem_cache_log = false; - /// Don't populate cache when the read is not part of query execution (e.g. background thread). bool force_read_through_cache_merges = false; size_t filesystem_cache_segments_batch_size = 20; From 1eba06dc113881b2845d36a7d3a4703ad64659d7 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Tue, 27 Feb 2024 23:12:41 +0800 Subject: [PATCH 070/985] Update 02241_filesystem_cache_on_write_operations.reference --- .../02241_filesystem_cache_on_write_operations.reference | 6 ------ 1 file changed, 6 deletions(-) diff --git a/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.reference b/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.reference index c03b928684b..53566a18edc 100644 --- a/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.reference +++ b/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.reference @@ -95,13 +95,7 @@ INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(300, 10000) SELECT count(), sum(size) FROM system.filesystem_cache 24 84045 SYSTEM START MERGES test_02241 -SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes' -85146 -SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes' OPTIMIZE TABLE test_02241 FINAL -SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes' -251542 -SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes' SELECT count(), sum(size) FROM system.filesystem_cache 32 167243 ALTER TABLE test_02241 UPDATE value = 'kek' WHERE key = 100 From ffd69e0e127f64cf90a41d7b710c375ced13f092 Mon Sep 17 00:00:00 2001 From: kssenii Date: Tue, 27 Feb 2024 23:22:04 +0800 Subject: [PATCH 071/985] Move setting to merge-tree level --- src/Core/ServerSettings.h | 3 --- src/Interpreters/Context.cpp | 1 - 
src/Storages/MergeTree/MergeTreeSequentialSource.cpp | 3 ++- src/Storages/MergeTree/MergeTreeSettings.h | 1 + .../config.d/force_read_through_cache_for_merges.xml | 4 +++- 5 files changed, 6 insertions(+), 6 deletions(-) diff --git a/src/Core/ServerSettings.h b/src/Core/ServerSettings.h index 0283b98638f..0063b3a2bd6 100644 --- a/src/Core/ServerSettings.h +++ b/src/Core/ServerSettings.h @@ -102,9 +102,6 @@ namespace DB M(UInt64, tables_loader_background_pool_size, 0, "The maximum number of threads that will be used for background async loading of tables. Zero means use all CPUs.", 0) \ M(Bool, async_load_databases, false, "Enable asynchronous loading of databases and tables to speedup server startup. Queries to not yet loaded entity will be blocked until load is finished.", 0) \ M(Bool, display_secrets_in_show_and_select, false, "Allow showing secrets in SHOW and SELECT queries via a format setting and a grant", 0) \ - \ - M(Bool, force_read_through_cache_for_merges, false, "Force read-through filesystem cache for merges", 0) \ - \ M(Seconds, keep_alive_timeout, DEFAULT_HTTP_KEEP_ALIVE_TIMEOUT, "The number of seconds that ClickHouse waits for incoming requests before closing the connection.", 0) \ M(Seconds, replicated_fetches_http_connection_timeout, 0, "HTTP connection timeout for part fetch requests. Inherited from default profile `http_connection_timeout` if not set explicitly.", 0) \ M(Seconds, replicated_fetches_http_send_timeout, 0, "HTTP send timeout for part fetch requests. Inherited from default profile `http_send_timeout` if not set explicitly.", 0) \ diff --git a/src/Interpreters/Context.cpp b/src/Interpreters/Context.cpp index a974eaca067..55a4df10206 100644 --- a/src/Interpreters/Context.cpp +++ b/src/Interpreters/Context.cpp @@ -5079,7 +5079,6 @@ ReadSettings Context::getReadSettings() const res.read_from_filesystem_cache_if_exists_otherwise_bypass_cache = settings.read_from_filesystem_cache_if_exists_otherwise_bypass_cache; res.enable_filesystem_cache_log = settings.enable_filesystem_cache_log; res.filesystem_cache_segments_batch_size = settings.filesystem_cache_segments_batch_size; - res.force_read_through_cache_merges = getServerSettings().force_read_through_cache_for_merges; res.filesystem_cache_max_download_size = settings.filesystem_cache_max_download_size; res.skip_download_if_exceeds_query_cache = settings.skip_download_if_exceeds_query_cache; diff --git a/src/Storages/MergeTree/MergeTreeSequentialSource.cpp b/src/Storages/MergeTree/MergeTreeSequentialSource.cpp index e375e8b0a9f..6b0c5ccb59a 100644 --- a/src/Storages/MergeTree/MergeTreeSequentialSource.cpp +++ b/src/Storages/MergeTree/MergeTreeSequentialSource.cpp @@ -151,7 +151,8 @@ MergeTreeSequentialSource::MergeTreeSequentialSource( const auto & context = storage.getContext(); ReadSettings read_settings = context->getReadSettings(); - read_settings.read_from_filesystem_cache_if_exists_otherwise_bypass_cache = !read_settings.force_read_through_cache_merges; + read_settings.read_from_filesystem_cache_if_exists_otherwise_bypass_cache = !storage.getSettings()->force_read_through_cache_for_merges; + /// It does not make sense to use pthread_threadpool for background merges/mutations /// And also to preserve backward compatibility read_settings.local_fs_method = LocalFSReadMethod::pread; diff --git a/src/Storages/MergeTree/MergeTreeSettings.h b/src/Storages/MergeTree/MergeTreeSettings.h index b64632b6139..9cb74e76dd5 100644 --- a/src/Storages/MergeTree/MergeTreeSettings.h +++ 
b/src/Storages/MergeTree/MergeTreeSettings.h @@ -191,6 +191,7 @@ struct Settings; M(String, remote_fs_zero_copy_zookeeper_path, "/clickhouse/zero_copy", "ZooKeeper path for zero-copy table-independent info.", 0) \ M(Bool, remote_fs_zero_copy_path_compatible_mode, false, "Run zero-copy in compatible mode during conversion process.", 0) \ M(Bool, cache_populated_by_fetch, false, "Only available in ClickHouse Cloud", 0) \ + M(Bool, force_read_through_cache_for_merges, false, "Force read-through filesystem cache for merges", 0) \ M(Bool, allow_experimental_block_number_column, false, "Enable persisting column _block_number for each row.", 0) \ M(Bool, allow_experimental_replacing_merge_with_cleanup, false, "Allow experimental CLEANUP merges for ReplacingMergeTree with is_deleted column.", 0) \ \ diff --git a/tests/integration/test_filesystem_cache/config.d/force_read_through_cache_for_merges.xml b/tests/integration/test_filesystem_cache/config.d/force_read_through_cache_for_merges.xml index bb2a6e850a4..23d3fdea800 100644 --- a/tests/integration/test_filesystem_cache/config.d/force_read_through_cache_for_merges.xml +++ b/tests/integration/test_filesystem_cache/config.d/force_read_through_cache_for_merges.xml @@ -1,3 +1,5 @@ - 1 + + 1 + From 524a2ca72decc124ef1e38b79843c2388cceb0bb Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Tue, 27 Feb 2024 19:17:34 +0100 Subject: [PATCH 072/985] WIP on createForShard --- .../OptimizeShardingKeyRewriteInVisitor.cpp | 44 +++++++++++++++++++ 1 file changed, 44 insertions(+) diff --git a/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.cpp b/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.cpp index 3a592c0fe55..8aca28a90ef 100644 --- a/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.cpp +++ b/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.cpp @@ -5,6 +5,12 @@ #include #include #include +#include "Analyzer/ColumnNode.h" +#include "Analyzer/ConstantNode.h" +#include "Analyzer/FunctionNode.h" +#include "Analyzer/IQueryTreeNode.h" +#include "Analyzer/InDepthQueryTreeVisitor.h" +#include "DataTypes/IDataType.h" namespace { @@ -119,4 +125,42 @@ void OptimizeShardingKeyRewriteInMatcher::visit(ASTFunction & function, Data & d } } + +class OptimizeShardingKeyRewriteIn : InDepthQueryTreeVisitorWithContext +{ +public: + using Base = InDepthQueryTreeVisitorWithContext; + using Base::Base; + + void enterImpl(QueryTreeNodePtr & node) + { + auto * function_node = node->as(); + if (!function_node || function_node->getFunctionName() != "in") + return; + + auto & arguments = function_node->getArguments().getNodes(); + auto * column = arguments[0]->as(); + if (!column) + return; + + if (!data.sharding_key_expr->getRequiredColumnsWithTypes().contains(column->getColumnName())) + return; + + if (auto * constant = arguments[1]->as()) + { + if (isTuple(constant->getResultType())) + { + auto & tuple = constant->getValue().get(); + std::erase_if(tuple, [&](auto & child) + { + return tuple.size() > 1 && !shardContains(child, name, data); + }); + } + } + } + + OptimizeShardingKeyRewriteInMatcher::Data data; +}; + + } From cb8390e9c8672bcdead0108be75021d6c6f21331 Mon Sep 17 00:00:00 2001 From: kssenii Date: Wed, 28 Feb 2024 13:32:43 +0800 Subject: [PATCH 073/985] Fix build --- src/Disks/ObjectStorages/ObjectStorageFactory.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Disks/ObjectStorages/ObjectStorageFactory.cpp b/src/Disks/ObjectStorages/ObjectStorageFactory.cpp index f64c42c1403..d0c2c9ac4f4 100644 --- 
a/src/Disks/ObjectStorages/ObjectStorageFactory.cpp +++ b/src/Disks/ObjectStorages/ObjectStorageFactory.cpp @@ -16,10 +16,10 @@ #ifndef CLICKHOUSE_KEEPER_STANDALONE_BUILD #include #include -#include #include #endif #include +#include #include #include From 0de2d766fa971f54eff40641e16ed6857e1ece5f Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Wed, 28 Feb 2024 15:30:06 +0100 Subject: [PATCH 074/985] WIP on different JSONs on shards --- src/Analyzer/IdentifierNode.cpp | 10 +- src/Analyzer/IdentifierNode.h | 6 ++ src/DataTypes/ObjectUtils.cpp | 75 ++++++++++++- src/DataTypes/ObjectUtils.h | 11 ++ .../ClusterProxy/SelectStreamFactory.cpp | 79 +++++++++++++- .../ClusterProxy/SelectStreamFactory.h | 26 +++++ .../ClusterProxy/executeQuery.cpp | 101 ++++++++++++------ src/Interpreters/ClusterProxy/executeQuery.h | 2 - .../OptimizeShardingKeyRewriteInVisitor.cpp | 35 ++++-- .../OptimizeShardingKeyRewriteInVisitor.h | 3 + src/Processors/QueryPlan/ReadFromRemote.cpp | 10 +- src/Storages/StorageDistributed.cpp | 32 +++--- 12 files changed, 325 insertions(+), 65 deletions(-) diff --git a/src/Analyzer/IdentifierNode.cpp b/src/Analyzer/IdentifierNode.cpp index 88b3daacb12..7e4d4c02a4c 100644 --- a/src/Analyzer/IdentifierNode.cpp +++ b/src/Analyzer/IdentifierNode.cpp @@ -1,3 +1,4 @@ +#include #include #include @@ -56,13 +57,18 @@ void IdentifierNode::updateTreeHashImpl(HashState & state) const QueryTreeNodePtr IdentifierNode::cloneImpl() const { - return std::make_shared(identifier); + auto result = std::make_shared(identifier); + result->use_parts_for_to_ast = use_parts_for_to_ast; + return result; } ASTPtr IdentifierNode::toASTImpl(const ConvertToASTOptions & /* options */) const { auto identifier_parts = identifier.getParts(); - return std::make_shared(std::move(identifier_parts)); + if (use_parts_for_to_ast) + return std::make_shared(std::move(identifier_parts)); + else + return std::make_shared(identifier.getFullName()); } } diff --git a/src/Analyzer/IdentifierNode.h b/src/Analyzer/IdentifierNode.h index 872bb14d512..3bc37b4c69d 100644 --- a/src/Analyzer/IdentifierNode.h +++ b/src/Analyzer/IdentifierNode.h @@ -52,6 +52,11 @@ public: void dumpTreeImpl(WriteBuffer & buffer, FormatState & format_state, size_t indent) const override; + void useFullNameInToAST() + { + use_parts_for_to_ast = false; + } + protected: bool isEqualImpl(const IQueryTreeNode & rhs) const override; @@ -64,6 +69,7 @@ protected: private: Identifier identifier; std::optional table_expression_modifiers; + bool use_parts_for_to_ast = false; static constexpr size_t children_size = 0; }; diff --git a/src/DataTypes/ObjectUtils.cpp b/src/DataTypes/ObjectUtils.cpp index 23d29136c85..01ba50d90f3 100644 --- a/src/DataTypes/ObjectUtils.cpp +++ b/src/DataTypes/ObjectUtils.cpp @@ -1,3 +1,4 @@ +#include #include #include #include @@ -20,6 +21,16 @@ #include #include #include +#include "Analyzer/ConstantNode.h" +#include "Analyzer/FunctionNode.h" +#include "Analyzer/IQueryTreeNode.h" +#include "Analyzer/Identifier.h" +#include "Analyzer/IdentifierNode.h" +#include "Analyzer/QueryNode.h" +#include "Analyzer/Utils.h" +#include +#include +#include "Common/logger_useful.h" namespace DB @@ -888,10 +899,10 @@ static void addConstantToWithClause(const ASTPtr & query, const String & column_ /// @expected_columns and @available_columns contain descriptions /// of extended Object columns. 
-void replaceMissedSubcolumnsByConstants( +NamesAndTypes calculateMissedSubcolumns( const ColumnsDescription & expected_columns, - const ColumnsDescription & available_columns, - ASTPtr query) + const ColumnsDescription & available_columns +) { NamesAndTypes missed_names_types; @@ -928,6 +939,18 @@ void replaceMissedSubcolumnsByConstants( [](const auto & lhs, const auto & rhs) { return lhs.name < rhs.name; }); } + return missed_names_types; +} + +/// @expected_columns and @available_columns contain descriptions +/// of extended Object columns. +void replaceMissedSubcolumnsByConstants( + const ColumnsDescription & expected_columns, + const ColumnsDescription & available_columns, + ASTPtr query) +{ + NamesAndTypes missed_names_types = calculateMissedSubcolumns(expected_columns, available_columns); + if (missed_names_types.empty()) return; @@ -940,6 +963,52 @@ void replaceMissedSubcolumnsByConstants( addConstantToWithClause(query, name, type); } +/// @expected_columns and @available_columns contain descriptions +/// of extended Object columns. +void replaceMissedSubcolumnsByConstants( + const ColumnsDescription & expected_columns, + const ColumnsDescription & available_columns, + QueryTreeNodePtr & query, + const ContextPtr & context [[maybe_unused]]) +{ + NamesAndTypes missed_names_types = calculateMissedSubcolumns(expected_columns, available_columns); + + if (missed_names_types.empty()) + return; + + auto * query_node = query->as(); + if (!query_node) + return; + + auto table_expression = extractLeftTableExpression(query_node->getJoinTree()); + + auto & with_nodes = query_node->getWith().getNodes(); + + std::unordered_map column_name_to_node; + for (const auto & [name, type] : missed_names_types) + { + auto constant = std::make_shared(type->getDefault(), type); + constant->setAlias(table_expression->getAlias() + name); + // auto materialize = std::make_shared("materialize"); + + // auto function = FunctionFactory::instance().get("materialize", context); + // materialize->getArguments().getNodes() = { constant }; + // materialize->resolveAsFunction(function->build(materialize->getArgumentColumns())); + // materialize->setAlias(name); + + with_nodes.push_back(constant); + + auto id = std::make_shared(Identifier(table_expression->getAlias() + name)); + id->useFullNameInToAST(); + column_name_to_node[name] = id; + LOG_DEBUG(&Poco::Logger::get("replaceMissedSubcolumnsByConstants"), "Name {} Expression\n{}", name, column_name_to_node[name]->dumpTree()); + } + + LOG_DEBUG(&Poco::Logger::get("replaceMissedSubcolumnsByConstants"), "Table expression\n{} ", table_expression->dumpTree()); + replaceColumns(query, table_expression, column_name_to_node); + LOG_DEBUG(&Poco::Logger::get("replaceMissedSubcolumnsByConstants"), "Result:\n{} ", query->dumpTree()); +} + Field FieldVisitorReplaceScalars::operator()(const Array & x) const { if (num_dimensions_to_keep == 0) diff --git a/src/DataTypes/ObjectUtils.h b/src/DataTypes/ObjectUtils.h index 2bfcaae09ca..f4a8abe8abf 100644 --- a/src/DataTypes/ObjectUtils.h +++ b/src/DataTypes/ObjectUtils.h @@ -3,6 +3,8 @@ #include #include #include +#include "Analyzer/IQueryTreeNode.h" +#include "Interpreters/Context_fwd.h" #include #include #include @@ -14,6 +16,9 @@ namespace DB struct StorageSnapshot; using StorageSnapshotPtr = std::shared_ptr; +class IQueryTreeNode; +using QueryTreeNodePtr = std::shared_ptr; + /// Returns number of dimensions in Array type. 0 if type is not array. 
size_t getNumberOfDimensions(const IDataType & type); @@ -97,6 +102,12 @@ void replaceMissedSubcolumnsByConstants( const ColumnsDescription & available_columns, ASTPtr query); +void replaceMissedSubcolumnsByConstants( + const ColumnsDescription & expected_columns, + const ColumnsDescription & available_columns, + QueryTreeNodePtr & query, + const ContextPtr & context); + /// Visitor that keeps @num_dimensions_to_keep dimensions in arrays /// and replaces all scalars or nested arrays to @replacement at that level. class FieldVisitorReplaceScalars : public StaticVisitor diff --git a/src/Interpreters/ClusterProxy/SelectStreamFactory.cpp b/src/Interpreters/ClusterProxy/SelectStreamFactory.cpp index f0592735caf..5167ffc0e27 100644 --- a/src/Interpreters/ClusterProxy/SelectStreamFactory.cpp +++ b/src/Interpreters/ClusterProxy/SelectStreamFactory.cpp @@ -5,6 +5,10 @@ #include #include #include +#include "Analyzer/IQueryTreeNode.h" +#include "Interpreters/InterpreterSelectQueryAnalyzer.h" +#include "Interpreters/SelectQueryOptions.h" +#include "Planner/Utils.h" #include #include #include @@ -124,18 +128,55 @@ void SelectStreamFactory::createForShard( if (it != objects_by_shard.end()) replaceMissedSubcolumnsByConstants(storage_snapshot->object_columns, it->second, query_ast); + createForShardImpl( + shard_info, + query_ast, + main_table, + table_func_ptr, + std::move(context), + local_plans, + remote_shards, + shard_count, + parallel_replicas_enabled, + std::move(shard_filter_generator)); +} + +void SelectStreamFactory::createForShardImpl( + const Cluster::ShardInfo & shard_info, + const ASTPtr & query_ast, + const StorageID & main_table, + const ASTPtr & table_func_ptr, + ContextPtr context, + std::vector & local_plans, + Shards & remote_shards, + UInt32 shard_count, + bool parallel_replicas_enabled, + AdditionalShardFilterGenerator shard_filter_generator) +{ auto emplace_local_stream = [&]() { + Block shard_header; + if (context->getSettingsRef().allow_experimental_analyzer) + shard_header = InterpreterSelectQueryAnalyzer::getSampleBlock(query_ast, context, SelectQueryOptions(processed_stage).analyze()); + else + shard_header = header; + local_plans.emplace_back(createLocalPlan( - query_ast, header, context, processed_stage, shard_info.shard_num, shard_count)); + query_ast, shard_header, context, processed_stage, shard_info.shard_num, shard_count)); }; auto emplace_remote_stream = [&](bool lazy = false, time_t local_delay = 0) { + Block shard_header; + if (context->getSettingsRef().allow_experimental_analyzer) + shard_header = InterpreterSelectQueryAnalyzer::getSampleBlock(query_ast, context, SelectQueryOptions(processed_stage).analyze()); + else + shard_header = header; + remote_shards.emplace_back(Shard{ .query = query_ast, .main_table = main_table, - .header = header, + .header = shard_header, .shard_info = shard_info, .lazy = lazy, .local_delay = local_delay, @@ -243,6 +284,40 @@ void SelectStreamFactory::createForShard( emplace_remote_stream(); } +void SelectStreamFactory::createForShard( + const Cluster::ShardInfo & shard_info, + const QueryTreeNodePtr & query_tree, + const StorageID & main_table, + const ASTPtr & table_func_ptr, + ContextPtr context, + std::vector & local_plans, + Shards & remote_shards, + UInt32 shard_count, + bool parallel_replicas_enabled, + AdditionalShardFilterGenerator shard_filter_generator) +{ + + auto it = objects_by_shard.find(shard_info.shard_num); + QueryTreeNodePtr modified_query = query_tree; + if (it != objects_by_shard.end()) + 
replaceMissedSubcolumnsByConstants(storage_snapshot->object_columns, it->second, modified_query, context); + + auto query_ast = queryNodeToDistributedSelectQuery(modified_query); + + createForShardImpl( + shard_info, + query_ast, + main_table, + table_func_ptr, + std::move(context), + local_plans, + remote_shards, + shard_count, + parallel_replicas_enabled, + std::move(shard_filter_generator)); + +} + } } diff --git a/src/Interpreters/ClusterProxy/SelectStreamFactory.h b/src/Interpreters/ClusterProxy/SelectStreamFactory.h index 9993ea7028d..45d6ea14c01 100644 --- a/src/Interpreters/ClusterProxy/SelectStreamFactory.h +++ b/src/Interpreters/ClusterProxy/SelectStreamFactory.h @@ -7,6 +7,7 @@ #include #include #include +#include "Analyzer/IQueryTreeNode.h" namespace DB { @@ -83,10 +84,35 @@ public: bool parallel_replicas_enabled, AdditionalShardFilterGenerator shard_filter_generator); + void createForShard( + const Cluster::ShardInfo & shard_info, + const QueryTreeNodePtr & query_tree, + const StorageID & main_table, + const ASTPtr & table_func_ptr, + ContextPtr context, + std::vector & local_plans, + Shards & remote_shards, + UInt32 shard_count, + bool parallel_replicas_enabled, + AdditionalShardFilterGenerator shard_filter_generator); + const Block header; const ColumnsDescriptionByShardNum objects_by_shard; const StorageSnapshotPtr storage_snapshot; QueryProcessingStage::Enum processed_stage; + +private: + void createForShardImpl( + const Cluster::ShardInfo & shard_info, + const ASTPtr & query_ast, + const StorageID & main_table, + const ASTPtr & table_func_ptr, + ContextPtr context, + std::vector & local_plans, + Shards & remote_shards, + UInt32 shard_count, + bool parallel_replicas_enabled, + AdditionalShardFilterGenerator shard_filter_generator); }; } diff --git a/src/Interpreters/ClusterProxy/executeQuery.cpp b/src/Interpreters/ClusterProxy/executeQuery.cpp index 6cdff939af1..07ef7aa6c96 100644 --- a/src/Interpreters/ClusterProxy/executeQuery.cpp +++ b/src/Interpreters/ClusterProxy/executeQuery.cpp @@ -204,12 +204,10 @@ void executeQuery( const ASTPtr & table_func_ptr, SelectStreamFactory & stream_factory, LoggerPtr log, - const ASTPtr & query_ast, ContextPtr context, const SelectQueryInfo & query_info, const ExpressionActionsPtr & sharding_key_expr, const std::string & sharding_key_column_name, - const ClusterPtr & not_optimized_cluster, const DistributedSettings & distributed_settings, AdditionalShardFilterGenerator shard_filter_generator) { @@ -218,6 +216,8 @@ void executeQuery( if (settings.max_distributed_depth && context->getClientInfo().distributed_depth >= settings.max_distributed_depth) throw Exception(ErrorCodes::TOO_LARGE_DISTRIBUTED_DEPTH, "Maximum distributed depth exceeded"); + const ClusterPtr & not_optimized_cluster = query_info.cluster; + std::vector plans; SelectStreamFactory::Shards remote_shards; @@ -237,40 +237,81 @@ void executeQuery( new_context->increaseDistributedDepth(); const size_t shards = cluster->getShardCount(); - for (size_t i = 0, s = cluster->getShardsInfo().size(); i < s; ++i) + + if (context->getSettingsRef().allow_experimental_analyzer) { - const auto & shard_info = cluster->getShardsInfo()[i]; - - ASTPtr query_ast_for_shard = query_ast->clone(); - if (sharding_key_expr && query_info.optimized_cluster && settings.optimize_skip_unused_shards_rewrite_in && shards > 1) + for (size_t i = 0, s = cluster->getShardsInfo().size(); i < s; ++i) { - OptimizeShardingKeyRewriteInVisitor::Data visitor_data{ - sharding_key_expr, - 
sharding_key_expr->getSampleBlock().getByPosition(0).type, - sharding_key_column_name, + const auto & shard_info = cluster->getShardsInfo()[i]; + + auto query_for_shard = query_info.query_tree->clone(); + if (sharding_key_expr && query_info.optimized_cluster && settings.optimize_skip_unused_shards_rewrite_in && shards > 1) + { + OptimizeShardingKeyRewriteInVisitor::Data visitor_data{ + sharding_key_expr, + sharding_key_expr->getSampleBlock().getByPosition(0).type, + sharding_key_column_name, + shard_info, + not_optimized_cluster->getSlotToShard(), + }; + optimizeShardingKeyRewriteIn(query_for_shard, std::move(visitor_data), new_context); + } + + // decide for each shard if parallel reading from replicas should be enabled + // according to settings and number of replicas declared per shard + const auto & addresses = cluster->getShardsAddresses().at(i); + bool parallel_replicas_enabled = addresses.size() > 1 && context->canUseTaskBasedParallelReplicas(); + + stream_factory.createForShard( shard_info, - not_optimized_cluster->getSlotToShard(), - }; - OptimizeShardingKeyRewriteInVisitor visitor(visitor_data); - visitor.visit(query_ast_for_shard); + query_for_shard, + main_table, + table_func_ptr, + new_context, + plans, + remote_shards, + static_cast(shards), + parallel_replicas_enabled, + shard_filter_generator); } + } + else + { + for (size_t i = 0, s = cluster->getShardsInfo().size(); i < s; ++i) + { + const auto & shard_info = cluster->getShardsInfo()[i]; - // decide for each shard if parallel reading from replicas should be enabled - // according to settings and number of replicas declared per shard - const auto & addresses = cluster->getShardsAddresses().at(i); - bool parallel_replicas_enabled = addresses.size() > 1 && context->canUseTaskBasedParallelReplicas(); + ASTPtr query_ast_for_shard = query_info.query->clone(); + if (sharding_key_expr && query_info.optimized_cluster && settings.optimize_skip_unused_shards_rewrite_in && shards > 1) + { + OptimizeShardingKeyRewriteInVisitor::Data visitor_data{ + sharding_key_expr, + sharding_key_expr->getSampleBlock().getByPosition(0).type, + sharding_key_column_name, + shard_info, + not_optimized_cluster->getSlotToShard(), + }; + OptimizeShardingKeyRewriteInVisitor visitor(visitor_data); + visitor.visit(query_ast_for_shard); + } - stream_factory.createForShard( - shard_info, - query_ast_for_shard, - main_table, - table_func_ptr, - new_context, - plans, - remote_shards, - static_cast(shards), - parallel_replicas_enabled, - shard_filter_generator); + // decide for each shard if parallel reading from replicas should be enabled + // according to settings and number of replicas declared per shard + const auto & addresses = cluster->getShardsAddresses().at(i); + bool parallel_replicas_enabled = addresses.size() > 1 && context->canUseTaskBasedParallelReplicas(); + + stream_factory.createForShard( + shard_info, + query_ast_for_shard, + main_table, + table_func_ptr, + new_context, + plans, + remote_shards, + static_cast(shards), + parallel_replicas_enabled, + shard_filter_generator); + } } if (!remote_shards.empty()) diff --git a/src/Interpreters/ClusterProxy/executeQuery.h b/src/Interpreters/ClusterProxy/executeQuery.h index bbc3c6c9e49..8f6f6300c7b 100644 --- a/src/Interpreters/ClusterProxy/executeQuery.h +++ b/src/Interpreters/ClusterProxy/executeQuery.h @@ -58,12 +58,10 @@ void executeQuery( const ASTPtr & table_func_ptr, SelectStreamFactory & stream_factory, LoggerPtr log, - const ASTPtr & query_ast, ContextPtr context, const SelectQueryInfo & 
query_info, const ExpressionActionsPtr & sharding_key_expr, const std::string & sharding_key_column_name, - const ClusterPtr & not_optimized_cluster, const DistributedSettings & distributed_settings, AdditionalShardFilterGenerator shard_filter_generator); diff --git a/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.cpp b/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.cpp index 8aca28a90ef..42c6e63da01 100644 --- a/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.cpp +++ b/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.cpp @@ -1,3 +1,4 @@ +#include #include #include #include @@ -11,6 +12,7 @@ #include "Analyzer/IQueryTreeNode.h" #include "Analyzer/InDepthQueryTreeVisitor.h" #include "DataTypes/IDataType.h" +#include "Interpreters/Context_fwd.h" namespace { @@ -126,11 +128,15 @@ void OptimizeShardingKeyRewriteInMatcher::visit(ASTFunction & function, Data & d } -class OptimizeShardingKeyRewriteIn : InDepthQueryTreeVisitorWithContext +class OptimizeShardingKeyRewriteIn : public InDepthQueryTreeVisitorWithContext { public: using Base = InDepthQueryTreeVisitorWithContext; - using Base::Base; + + OptimizeShardingKeyRewriteIn(OptimizeShardingKeyRewriteInVisitor::Data data_, ContextPtr context) + : Base(std::move(context)) + , data(std::move(data_)) + {} void enterImpl(QueryTreeNodePtr & node) { @@ -143,6 +149,8 @@ public: if (!column) return; + auto name = column->getColumnName(); + if (!data.sharding_key_expr->getRequiredColumnsWithTypes().contains(column->getColumnName())) return; @@ -150,17 +158,30 @@ public: { if (isTuple(constant->getResultType())) { - auto & tuple = constant->getValue().get(); - std::erase_if(tuple, [&](auto & child) + const auto & tuple = constant->getValue().get(); + Tuple new_tuple; + new_tuple.reserve(tuple.size()); + + for (const auto & child : tuple) { - return tuple.size() > 1 && !shardContains(child, name, data); - }); + if (shardContains(child, name, data)) + new_tuple.push_back(child); + } + + if (new_tuple.empty()) + new_tuple.push_back(tuple.back()); + node = std::make_shared(new_tuple); } } } - OptimizeShardingKeyRewriteInMatcher::Data data; + OptimizeShardingKeyRewriteInVisitor::Data data; }; +void optimizeShardingKeyRewriteIn(QueryTreeNodePtr & node, OptimizeShardingKeyRewriteInVisitor::Data data, ContextPtr context) +{ + OptimizeShardingKeyRewriteIn visitor(std::move(data), std::move(context)); + visitor.visit(node); +} } diff --git a/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.h b/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.h index d546db40df7..d202609160b 100644 --- a/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.h +++ b/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.h @@ -2,6 +2,7 @@ #include #include +#include "Analyzer/IQueryTreeNode.h" namespace DB { @@ -44,4 +45,6 @@ struct OptimizeShardingKeyRewriteInMatcher using OptimizeShardingKeyRewriteInVisitor = InDepthNodeVisitor; +void optimizeShardingKeyRewriteIn(QueryTreeNodePtr & node, OptimizeShardingKeyRewriteInVisitor::Data data, ContextPtr context); + } diff --git a/src/Processors/QueryPlan/ReadFromRemote.cpp b/src/Processors/QueryPlan/ReadFromRemote.cpp index 93c73a66b78..022c4f699f2 100644 --- a/src/Processors/QueryPlan/ReadFromRemote.cpp +++ b/src/Processors/QueryPlan/ReadFromRemote.cpp @@ -216,7 +216,7 @@ void ReadFromRemote::addLazyPipe(Pipes & pipes, const ClusterProxy::SelectStream }; pipes.emplace_back(createDelayedPipe(shard.header, lazily_create_stream, add_totals, add_extremes)); - addConvertingActions(pipes.back(), output_stream->header); + 
addConvertingActions(pipes.back(), shard.header); } void ReadFromRemote::addPipe(Pipes & pipes, const ClusterProxy::SelectStreamFactory::Shard & shard) @@ -281,7 +281,7 @@ void ReadFromRemote::addPipe(Pipes & pipes, const ClusterProxy::SelectStreamFact auto remote_query_executor = std::make_shared( shard.shard_info.pool, query_string, - output_stream->header, + shard.header, context, throttler, scalars, @@ -297,7 +297,7 @@ void ReadFromRemote::addPipe(Pipes & pipes, const ClusterProxy::SelectStreamFact pipes.emplace_back( createRemoteSourcePipe(remote_query_executor, add_agg_info, add_totals, add_extremes, async_read, async_query_sending)); - addConvertingActions(pipes.back(), output_stream->header); + addConvertingActions(pipes.back(), shard.header); } } else @@ -305,7 +305,7 @@ void ReadFromRemote::addPipe(Pipes & pipes, const ClusterProxy::SelectStreamFact const String query_string = formattedAST(shard.query); auto remote_query_executor = std::make_shared( - shard.shard_info.pool, query_string, output_stream->header, context, throttler, scalars, external_tables, stage); + shard.shard_info.pool, query_string, shard.header, context, throttler, scalars, external_tables, stage); remote_query_executor->setLogger(log); if (context->canUseTaskBasedParallelReplicas()) @@ -326,7 +326,7 @@ void ReadFromRemote::addPipe(Pipes & pipes, const ClusterProxy::SelectStreamFact pipes.emplace_back( createRemoteSourcePipe(remote_query_executor, add_agg_info, add_totals, add_extremes, async_read, async_query_sending)); - addConvertingActions(pipes.back(), output_stream->header); + addConvertingActions(pipes.back(), shard.header); } } diff --git a/src/Storages/StorageDistributed.cpp b/src/Storages/StorageDistributed.cpp index 92e7dcdf4f2..34ab21a4751 100644 --- a/src/Storages/StorageDistributed.cpp +++ b/src/Storages/StorageDistributed.cpp @@ -30,6 +30,7 @@ #include #include #include +#include "Analyzer/IQueryTreeNode.h" #include #include @@ -813,7 +814,8 @@ void StorageDistributed::read( const size_t /*num_streams*/) { Block header; - ASTPtr query_ast; + + SelectQueryInfo modified_query_info = query_info; if (local_context->getSettingsRef().allow_experimental_analyzer) { @@ -821,7 +823,7 @@ void StorageDistributed::read( if (!remote_table_function_ptr) remote_storage_id = StorageID{remote_database, remote_table}; - auto query_tree_distributed = buildQueryTreeDistributed(query_info, + auto query_tree_distributed = buildQueryTreeDistributed(modified_query_info, storage_snapshot, remote_storage_id, remote_table_function_ptr); @@ -831,20 +833,24 @@ void StorageDistributed::read( */ for (auto & column : header) column.column = column.column->convertToFullColumnIfConst(); - query_ast = queryNodeToDistributedSelectQuery(query_tree_distributed); + modified_query_info.query = queryNodeToDistributedSelectQuery(query_tree_distributed); + + modified_query_info.query_tree = std::move(query_tree_distributed); } else { - header = InterpreterSelectQuery(query_info.query, local_context, SelectQueryOptions(processed_stage).analyze()).getSampleBlock(); - query_ast = query_info.query; + header = InterpreterSelectQuery(modified_query_info.query, local_context, SelectQueryOptions(processed_stage).analyze()).getSampleBlock(); } - const auto & modified_query_ast = ClusterProxy::rewriteSelectQuery( - local_context, query_ast, - remote_database, remote_table, remote_table_function_ptr); + if (!local_context->getSettingsRef().allow_experimental_analyzer) + { + modified_query_info.query = ClusterProxy::rewriteSelectQuery( + 
local_context, modified_query_info.query, + remote_database, remote_table, remote_table_function_ptr); + } /// Return directly (with correct header) if no shard to query. - if (query_info.getCluster()->getShardsInfo().empty()) + if (modified_query_info.getCluster()->getShardsInfo().empty()) { if (local_context->getSettingsRef().allow_experimental_analyzer) return; @@ -872,7 +878,7 @@ void StorageDistributed::read( const auto & settings = local_context->getSettingsRef(); ClusterProxy::AdditionalShardFilterGenerator additional_shard_filter_generator; - if (local_context->canUseParallelReplicasCustomKey(*query_info.getCluster())) + if (local_context->canUseParallelReplicasCustomKey(*modified_query_info.getCluster())) { if (auto custom_key_ast = parseCustomKeyForTable(settings.parallel_replicas_custom_key, *local_context)) { @@ -881,7 +887,7 @@ void StorageDistributed::read( column_description = this->getInMemoryMetadataPtr()->columns, custom_key_type = settings.parallel_replicas_custom_key_filter_type.value, context = local_context, - replica_count = query_info.getCluster()->getShardsInfo().front().per_replica_pools.size()](uint64_t replica_num) -> ASTPtr + replica_count = modified_query_info.getCluster()->getShardsInfo().front().per_replica_pools.size()](uint64_t replica_num) -> ASTPtr { return getCustomKeyFilterForParallelReplica( replica_count, replica_num - 1, my_custom_key_ast, custom_key_type, column_description, context); @@ -897,12 +903,10 @@ void StorageDistributed::read( remote_table_function_ptr, select_stream_factory, log, - modified_query_ast, local_context, - query_info, + modified_query_info, sharding_key_expr, sharding_key_column_name, - query_info.cluster, distributed_settings, additional_shard_filter_generator); From 8bf7c2c5971afc22dda32f9f4ad453ac481f2359 Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Wed, 28 Feb 2024 15:40:42 +0100 Subject: [PATCH 075/985] Use output header --- src/Processors/QueryPlan/ReadFromRemote.cpp | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/src/Processors/QueryPlan/ReadFromRemote.cpp b/src/Processors/QueryPlan/ReadFromRemote.cpp index 022c4f699f2..fde2313bc15 100644 --- a/src/Processors/QueryPlan/ReadFromRemote.cpp +++ b/src/Processors/QueryPlan/ReadFromRemote.cpp @@ -216,7 +216,7 @@ void ReadFromRemote::addLazyPipe(Pipes & pipes, const ClusterProxy::SelectStream }; pipes.emplace_back(createDelayedPipe(shard.header, lazily_create_stream, add_totals, add_extremes)); - addConvertingActions(pipes.back(), shard.header); + addConvertingActions(pipes.back(), output_stream->header); } void ReadFromRemote::addPipe(Pipes & pipes, const ClusterProxy::SelectStreamFactory::Shard & shard) @@ -297,7 +297,7 @@ void ReadFromRemote::addPipe(Pipes & pipes, const ClusterProxy::SelectStreamFact pipes.emplace_back( createRemoteSourcePipe(remote_query_executor, add_agg_info, add_totals, add_extremes, async_read, async_query_sending)); - addConvertingActions(pipes.back(), shard.header); + addConvertingActions(pipes.back(), output_stream->header); } } else @@ -326,7 +326,7 @@ void ReadFromRemote::addPipe(Pipes & pipes, const ClusterProxy::SelectStreamFact pipes.emplace_back( createRemoteSourcePipe(remote_query_executor, add_agg_info, add_totals, add_extremes, async_read, async_query_sending)); - addConvertingActions(pipes.back(), shard.header); + addConvertingActions(pipes.back(), output_stream->header); } } From d2ea882bd8105f5d2e173a6670bf23b2917b3190 Mon Sep 17 00:00:00 2001 From: avogar Date: Wed, 28 Feb 2024 21:26:19 +0000 Subject: 
[PATCH 076/985] Fix deadlock in parallel parsing when lots of rows are skipped due to errors --- .../Formats/Impl/ParallelParsingInputFormat.cpp | 4 +++- .../03001_parallel_parsing_deadlock.reference | 0 .../0_stateless/03001_parallel_parsing_deadlock.sh | 12 ++++++++++++ 3 files changed, 15 insertions(+), 1 deletion(-) create mode 100644 tests/queries/0_stateless/03001_parallel_parsing_deadlock.reference create mode 100755 tests/queries/0_stateless/03001_parallel_parsing_deadlock.sh diff --git a/src/Processors/Formats/Impl/ParallelParsingInputFormat.cpp b/src/Processors/Formats/Impl/ParallelParsingInputFormat.cpp index 8b6969bbfcc..447adb1ed48 100644 --- a/src/Processors/Formats/Impl/ParallelParsingInputFormat.cpp +++ b/src/Processors/Formats/Impl/ParallelParsingInputFormat.cpp @@ -224,7 +224,9 @@ Chunk ParallelParsingInputFormat::read() /// skipped all rows. For example, it can happen while using settings /// input_format_allow_errors_num/input_format_allow_errors_ratio /// and this segment contained only rows with errors. - /// Process the next unit. + /// Return this empty unit back to segmentator and process the next unit. + unit->status = READY_TO_INSERT; + segmentator_condvar.notify_all(); ++reader_ticket_number; unit = &processing_units[reader_ticket_number % processing_units.size()]; } diff --git a/tests/queries/0_stateless/03001_parallel_parsing_deadlock.reference b/tests/queries/0_stateless/03001_parallel_parsing_deadlock.reference new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/queries/0_stateless/03001_parallel_parsing_deadlock.sh b/tests/queries/0_stateless/03001_parallel_parsing_deadlock.sh new file mode 100755 index 00000000000..1bf21dfc53b --- /dev/null +++ b/tests/queries/0_stateless/03001_parallel_parsing_deadlock.sh @@ -0,0 +1,12 @@ +#!/usr/bin/env bash +# Tags: no-fasttest, no-cpu-aarch64 + +CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# shellcheck source=../shell_config.sh +. "$CURDIR"/../shell_config.sh + +DATA_FILE=$CLICKHOUSE_TEST_UNIQUE_NAME.csv +$CLICKHOUSE_LOCAL -q "select number > 1000000 ? 
'error' : toString(number) from numbers(2000000) format CSV" > $DATA_FILE +$CLICKHOUSE_LOCAL -q "select * from file($DATA_FILE, CSV, 'x UInt64') format Null settings input_format_allow_errors_ratio=1" +rm $DATA_FILE + From 974ba7364f193838f735a9233c6dec4298172542 Mon Sep 17 00:00:00 2001 From: Nikita Taranov Date: Thu, 29 Feb 2024 00:55:17 +0100 Subject: [PATCH 077/985] better --- src/Disks/ObjectStorages/S3/diskSettings.cpp | 16 +++++++++++++--- src/IO/S3/Client.cpp | 2 ++ src/IO/S3/URI.cpp | 2 +- src/IO/WriteBufferFromS3.h | 2 +- src/Storages/StorageS3.cpp | 4 ++++ 5 files changed, 21 insertions(+), 5 deletions(-) diff --git a/src/Disks/ObjectStorages/S3/diskSettings.cpp b/src/Disks/ObjectStorages/S3/diskSettings.cpp index b8688cd3de6..10172805f06 100644 --- a/src/Disks/ObjectStorages/S3/diskSettings.cpp +++ b/src/Disks/ObjectStorages/S3/diskSettings.cpp @@ -1,5 +1,6 @@ #include -#include "IO/S3/Client.h" +#include +#include #if USE_AWS_S3 @@ -10,7 +11,7 @@ #include #include #include -#include "Disks/DiskFactory.h" +#include #include #include @@ -25,6 +26,11 @@ namespace DB { +namespace ErrorCodes +{ +extern const int NO_ELEMENTS_IN_CONFIG; +} + std::unique_ptr getSettings(const Poco::Util::AbstractConfiguration & config, const String & config_prefix, ContextPtr context) { const Settings & settings = context->getSettingsRef(); @@ -47,11 +53,15 @@ std::unique_ptr getClient( const Settings & global_settings = context->getGlobalContext()->getSettingsRef(); const Settings & local_settings = context->getSettingsRef(); - String endpoint = context->getMacros()->expand(config.getString(config_prefix + ".endpoint")); + const String endpoint = context->getMacros()->expand(config.getString(config_prefix + ".endpoint")); S3::URI uri(endpoint); if (!uri.key.ends_with('/')) uri.key.push_back('/'); + if (S3::isS3ExpressEndpoint(endpoint) && !config.has(config_prefix + ".region")) + throw Exception( + ErrorCodes::NO_ELEMENTS_IN_CONFIG, "Region should be explicitly specified for directory buckets ({})", config_prefix); + S3::PocoHTTPClientConfiguration client_configuration = S3::ClientFactory::instance().createClientConfiguration( config.getString(config_prefix + ".region", ""), context->getRemoteHostFilter(), diff --git a/src/IO/S3/Client.cpp b/src/IO/S3/Client.cpp index a75d41df3d1..4f93aba2f84 100644 --- a/src/IO/S3/Client.cpp +++ b/src/IO/S3/Client.cpp @@ -1,4 +1,5 @@ #include +#include #if USE_AWS_S3 @@ -965,6 +966,7 @@ PocoHTTPClientConfiguration ClientFactory::createClientConfiguration( // NOLINT bool isS3ExpressEndpoint(const std::string & endpoint) { + /// On one hand this check isn't 100% reliable, on the other - all it will change is whether we attach checksums to the requests. return endpoint.contains("s3express"); } } diff --git a/src/IO/S3/URI.cpp b/src/IO/S3/URI.cpp index 062d3b80850..027cb624ed5 100644 --- a/src/IO/S3/URI.cpp +++ b/src/IO/S3/URI.cpp @@ -122,7 +122,7 @@ URI::URI(const std::string & uri_) "Object storage system name is unrecognized in virtual hosted style S3 URI: {}", quoteString(name)); - if (name == COS || name == COSN) + if (name == COS) storage_name = COSN; else storage_name = name; diff --git a/src/IO/WriteBufferFromS3.h b/src/IO/WriteBufferFromS3.h index 148cd27f854..59f4e19e15b 100644 --- a/src/IO/WriteBufferFromS3.h +++ b/src/IO/WriteBufferFromS3.h @@ -100,7 +100,7 @@ private: /// We initiate upload, then upload each part and get ETag as a response, and then finalizeImpl() upload with listing all our parts. 
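A minimal sketch (illustration only, not from the patch) of the idea behind the per-part checksums that S3 Express "directory buckets" require: each UploadPart request gets a CRC32 computed over its body, and the Base64-encoded value is remembered (in the `multipart_checksums` deque declared just below) so it can be attached to the corresponding part when the multipart upload is completed. The AWS SDK helpers match the calls used later in this series; error handling is omitted.

```cpp
#include <aws/core/utils/HashingUtils.h>
#include <aws/s3/model/UploadPartRequest.h>
#include <deque>
#include <string>

std::deque<std::string> multipart_checksums; // filled only when per-part checksums are enabled

void rememberPartChecksum(Aws::S3::Model::UploadPartRequest & req)
{
    // CRC32 over the part body, Base64-encoded as S3 expects it.
    auto checksum = Aws::Utils::HashingUtils::Base64Encode(
        Aws::Utils::HashingUtils::CalculateCRC32(*req.GetBody()));
    req.SetChecksumCRC32(checksum);
    multipart_checksums.emplace_back(checksum.c_str(), checksum.size());
}
```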
String multipart_upload_id; std::deque multipart_tags; - std::deque multipart_checksums; + std::deque multipart_checksums; // if enabled bool multipart_upload_finished = false; /// Track that prefinalize() is called only once diff --git a/src/Storages/StorageS3.cpp b/src/Storages/StorageS3.cpp index 044a1ca5362..f96ff8b7eb6 100644 --- a/src/Storages/StorageS3.cpp +++ b/src/Storages/StorageS3.cpp @@ -133,6 +133,7 @@ namespace ErrorCodes extern const int NOT_IMPLEMENTED; extern const int CANNOT_COMPILE_REGEXP; extern const int FILE_DOESNT_EXIST; + extern const int NO_ELEMENTS_IN_CONFIG; } @@ -1403,6 +1404,9 @@ void StorageS3::Configuration::connect(const ContextPtr & context) const Settings & global_settings = context->getGlobalContext()->getSettingsRef(); const Settings & local_settings = context->getSettingsRef(); + if (S3::isS3ExpressEndpoint(url.endpoint) && auth_settings.region.empty()) + throw Exception(ErrorCodes::NO_ELEMENTS_IN_CONFIG, "Region should be explicitly specified for directory buckets"); + S3::PocoHTTPClientConfiguration client_configuration = S3::ClientFactory::instance().createClientConfiguration( auth_settings.region, context->getRemoteHostFilter(), From 37917a3ed34df22756562a04a90d3c985ca23bd8 Mon Sep 17 00:00:00 2001 From: Nikita Taranov Date: Thu, 29 Feb 2024 01:42:32 +0100 Subject: [PATCH 078/985] better --- src/IO/S3/Requests.h | 12 ++++++++++++ src/IO/WriteBufferFromS3.cpp | 10 +++------- 2 files changed, 15 insertions(+), 7 deletions(-) diff --git a/src/IO/S3/Requests.h b/src/IO/S3/Requests.h index 6f82a0f39d3..196f074c9df 100644 --- a/src/IO/S3/Requests.h +++ b/src/IO/S3/Requests.h @@ -23,6 +23,7 @@ #include #include #include +#include #include @@ -39,6 +40,17 @@ inline void setPartChecksum(Model::CompletedPart & part, const std::string & che part.SetChecksumCRC32(checksum); } +inline void setRequestChecksum(Model::UploadPartRequest & req, const std::string & checksum) +{ + req.SetChecksumCRC32(checksum); +} + +inline std::string calculateChecksum(Model::UploadPartRequest & req) +{ + chassert(req.GetChecksumAlgorithm() == Aws::S3::Model::ChecksumAlgorithm::CRC32); + return Aws::Utils::HashingUtils::Base64Encode(Aws::Utils::HashingUtils::CalculateCRC32(*(req.GetBody()))); +} + template inline void setChecksumAlgorithm(R & request) { diff --git a/src/IO/WriteBufferFromS3.cpp b/src/IO/WriteBufferFromS3.cpp index a162992278f..80ca96b0382 100644 --- a/src/IO/WriteBufferFromS3.cpp +++ b/src/IO/WriteBufferFromS3.cpp @@ -18,10 +18,6 @@ #include #include -#include -#include -#include - #include @@ -461,9 +457,9 @@ S3::UploadPartRequest WriteBufferFromS3::getUploadRequest(size_t part_number, Pa /// Checksums need to be provided on CompleteMultipartUpload requests, so we calculate then manually and store in multipart_checksums if (client_ptr->isS3ExpressBucket()) { - chassert(req.GetChecksumAlgorithm() == Aws::S3::Model::ChecksumAlgorithm::CRC32); - req.SetChecksumCRC32(Aws::Utils::HashingUtils::Base64Encode(Aws::Utils::HashingUtils::CalculateCRC32(*(req.GetBody())))); - multipart_checksums.push_back(req.GetChecksumCRC32()); + auto checksum = S3::RequestChecksum::calculateChecksum(req); + S3::RequestChecksum::setRequestChecksum(req, checksum); + multipart_checksums.push_back(std::move(checksum)); } return req; From 6fbd298b3d7cc06b1f11727263a25bc613f7c295 Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Thu, 29 Feb 2024 05:03:09 +0300 Subject: [PATCH 079/985] Revert "Revert "Use `MergeTree` as a default table engine"" --- src/Core/Settings.h | 2 +- 
src/Core/SettingsChangesHistory.h | 1 + tests/queries/0_stateless/02184_default_table_engine.sql | 2 ++ 3 files changed, 4 insertions(+), 1 deletion(-) diff --git a/src/Core/Settings.h b/src/Core/Settings.h index ae6ea165cc9..5f52396d3bb 100644 --- a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -566,7 +566,7 @@ class IColumn; M(UInt64, min_free_disk_space_for_temporary_data, 0, "The minimum disk space to keep while writing temporary data used in external sorting and aggregation.", 0) \ \ M(DefaultTableEngine, default_temporary_table_engine, DefaultTableEngine::Memory, "Default table engine used when ENGINE is not set in CREATE TEMPORARY statement.",0) \ - M(DefaultTableEngine, default_table_engine, DefaultTableEngine::None, "Default table engine used when ENGINE is not set in CREATE statement.",0) \ + M(DefaultTableEngine, default_table_engine, DefaultTableEngine::MergeTree, "Default table engine used when ENGINE is not set in CREATE statement.",0) \ M(Bool, show_table_uuid_in_table_create_query_if_not_nil, false, "For tables in databases with Engine=Atomic show UUID of the table in its CREATE query.", 0) \ M(Bool, database_atomic_wait_for_drop_and_detach_synchronously, false, "When executing DROP or DETACH TABLE in Atomic database, wait for table data to be finally dropped or detached.", 0) \ M(Bool, enable_scalar_subquery_optimization, true, "If it is set to true, prevent scalar subqueries from (de)serializing large scalar values and possibly avoid running the same subquery more than once.", 0) \ diff --git a/src/Core/SettingsChangesHistory.h b/src/Core/SettingsChangesHistory.h index e8d013d13ec..661e7cb80da 100644 --- a/src/Core/SettingsChangesHistory.h +++ b/src/Core/SettingsChangesHistory.h @@ -133,6 +133,7 @@ static std::map sett {"function_visible_width_behavior", 0, 1, "We changed the default behavior of `visibleWidth` to be more precise"}, {"max_estimated_execution_time", 0, 0, "Separate max_execution_time and max_estimated_execution_time"}, {"iceberg_engine_ignore_schema_evolution", false, false, "Allow to ignore schema evolution in Iceberg table engine"}, + {"default_table_engine", "None", "MergeTree", "Set default table engine to MergeTree for better usability"}, {"optimize_injective_functions_in_group_by", false, true, "Replace injective functions by it's arguments in GROUP BY section in analyzer"}, {"update_insert_deduplication_token_in_dependent_materialized_views", false, false, "Allow to update insert deduplication token with table identifier during insert in dependent materialized views"}, {"azure_max_unexpected_write_error_retries", 4, 4, "The maximum number of retries in case of unexpected errors during Azure blob storage write"}, diff --git a/tests/queries/0_stateless/02184_default_table_engine.sql b/tests/queries/0_stateless/02184_default_table_engine.sql index a984ec1b6c9..aff30eeea98 100644 --- a/tests/queries/0_stateless/02184_default_table_engine.sql +++ b/tests/queries/0_stateless/02184_default_table_engine.sql @@ -1,3 +1,5 @@ +SET default_table_engine = 'None'; + CREATE TABLE table_02184 (x UInt8); --{serverError 119} SET default_table_engine = 'Log'; CREATE TABLE table_02184 (x UInt8); From 0d4648b535a61561d122c87cf181434215753b35 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Thu, 29 Feb 2024 10:30:17 +0800 Subject: [PATCH 080/985] Fix clang-tidy --- src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git 
a/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp b/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp index eba57969580..c0b45e1d46a 100644 --- a/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp +++ b/src/Disks/ObjectStorages/Local/LocalObjectStorage.cpp @@ -32,7 +32,7 @@ LocalObjectStorage::LocalObjectStorage(String key_prefix_) else description = "/"; - fs::create_directories(getCommonKeyPrefix()); + fs::create_directories(key_prefix); } bool LocalObjectStorage::exists(const StoredObject & object) const From 3188c1ebdac52efbdadb8f64a13b0c4b6f4e1acc Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Wed, 28 Feb 2024 13:51:48 +0800 Subject: [PATCH 081/985] Update test.py --- tests/integration/test_filesystem_cache/test.py | 13 +++++++++++-- 1 file changed, 11 insertions(+), 2 deletions(-) diff --git a/tests/integration/test_filesystem_cache/test.py b/tests/integration/test_filesystem_cache/test.py index f32fa4e9823..0cb1866f8e4 100644 --- a/tests/integration/test_filesystem_cache/test.py +++ b/tests/integration/test_filesystem_cache/test.py @@ -94,12 +94,21 @@ def test_parallel_cache_loading_on_startup(cluster, node_name): cache_state = node.query( "SELECT key, file_segment_range_begin, size FROM system.filesystem_cache WHERE size > 0 ORDER BY key, file_segment_range_begin, size" ) + keys = ( + node.query( + "SELECT distinct(key) FROM system.filesystem_cache WHERE size > 0 ORDER BY key, file_segment_range_begin, size" + ) + .strip() + .splitlines() + ) node.restart_clickhouse() - assert cache_count == int(node.query("SELECT count() FROM system.filesystem_cache")) + # < because of additional files loaded into cache on server startup. + assert cache_count <= int(node.query("SELECT count() FROM system.filesystem_cache")) + keys_set = ",".join(["'" + x + "'" for x in keys]) assert cache_state == node.query( - "SELECT key, file_segment_range_begin, size FROM system.filesystem_cache ORDER BY key, file_segment_range_begin, size" + f"SELECT key, file_segment_range_begin, size FROM system.filesystem_cache WHERE key in ({keys_set}) ORDER BY key, file_segment_range_begin, size" ) assert node.contains_in_log("Loading filesystem cache with 30 threads") From f8561b2265b924c64c60bdbc5305785c0f0b6f2e Mon Sep 17 00:00:00 2001 From: Sergei Trifonov Date: Thu, 29 Feb 2024 13:53:27 +0100 Subject: [PATCH 082/985] Revert "Revert "Support resource request canceling"" --- docs/en/operations/system-tables/scheduler.md | 4 + src/Common/Scheduler/ISchedulerNode.h | 2 + src/Common/Scheduler/ISchedulerQueue.h | 6 ++ src/Common/Scheduler/Nodes/FairPolicy.h | 99 ++++++++++--------- src/Common/Scheduler/Nodes/FifoQueue.h | 31 ++++-- src/Common/Scheduler/Nodes/PriorityPolicy.h | 38 ++++--- .../tests/gtest_dynamic_resource_manager.cpp | 1 - .../Nodes/tests/gtest_resource_scheduler.cpp | 63 ++++++++++++ src/Common/Scheduler/ResourceGuard.h | 9 +- src/Common/Scheduler/ResourceRequest.cpp | 13 +++ src/Common/Scheduler/ResourceRequest.h | 30 +++--- src/Common/Scheduler/SchedulerRoot.h | 32 +++--- .../System/StorageSystemScheduler.cpp | 4 + 13 files changed, 224 insertions(+), 108 deletions(-) create mode 100644 src/Common/Scheduler/ResourceRequest.cpp diff --git a/docs/en/operations/system-tables/scheduler.md b/docs/en/operations/system-tables/scheduler.md index 953db4c28f2..c4de7f76fdc 100644 --- a/docs/en/operations/system-tables/scheduler.md +++ b/docs/en/operations/system-tables/scheduler.md @@ -26,7 +26,9 @@ priority: 0 is_active: 0 active_children: 0 
dequeued_requests: 67 +canceled_requests: 0 dequeued_cost: 4692272 +canceled_cost: 0 busy_periods: 63 vruntime: 938454.1999999989 system_vruntime: ᴺᵁᴸᴸ @@ -54,7 +56,9 @@ Columns: - `is_active` (`UInt8`) - Whether this node is currently active - has resource requests to be dequeued and constraints satisfied. - `active_children` (`UInt64`) - The number of children in active state. - `dequeued_requests` (`UInt64`) - The total number of resource requests dequeued from this node. +- `canceled_requests` (`UInt64`) - The total number of resource requests canceled from this node. - `dequeued_cost` (`UInt64`) - The sum of costs (e.g. size in bytes) of all requests dequeued from this node. +- `canceled_cost` (`UInt64`) - The sum of costs (e.g. size in bytes) of all requests canceled from this node. - `busy_periods` (`UInt64`) - The total number of deactivations of this node. - `vruntime` (`Nullable(Float64)`) - For children of `fair` nodes only. Virtual runtime of a node used by SFQ algorithm to select the next child to process in a max-min fair manner. - `system_vruntime` (`Nullable(Float64)`) - For `fair` nodes only. Virtual runtime showing `vruntime` of the last processed resource request. Used during child activation as the new value of `vruntime`. diff --git a/src/Common/Scheduler/ISchedulerNode.h b/src/Common/Scheduler/ISchedulerNode.h index 804026d7bf4..20c1f4332da 100644 --- a/src/Common/Scheduler/ISchedulerNode.h +++ b/src/Common/Scheduler/ISchedulerNode.h @@ -387,7 +387,9 @@ public: /// Introspection std::atomic dequeued_requests{0}; + std::atomic canceled_requests{0}; std::atomic dequeued_cost{0}; + std::atomic canceled_cost{0}; std::atomic busy_periods{0}; }; diff --git a/src/Common/Scheduler/ISchedulerQueue.h b/src/Common/Scheduler/ISchedulerQueue.h index cbe63bd304a..532f4bf6c63 100644 --- a/src/Common/Scheduler/ISchedulerQueue.h +++ b/src/Common/Scheduler/ISchedulerQueue.h @@ -50,6 +50,12 @@ public: /// Should be called outside of scheduling subsystem, implementation must be thread-safe. virtual void enqueueRequest(ResourceRequest * request) = 0; + /// Cancel previously enqueued request. + /// Returns `false` and does nothing given unknown or already executed request. + /// Returns `true` if requests has been found and canceled. + /// Should be called outside of scheduling subsystem, implementation must be thread-safe. 
+ virtual bool cancelRequest(ResourceRequest * request) = 0; + /// For introspection ResourceCost getBudget() const { diff --git a/src/Common/Scheduler/Nodes/FairPolicy.h b/src/Common/Scheduler/Nodes/FairPolicy.h index c0e187e6fa9..ce2bf729a04 100644 --- a/src/Common/Scheduler/Nodes/FairPolicy.h +++ b/src/Common/Scheduler/Nodes/FairPolicy.h @@ -134,56 +134,65 @@ public: std::pair dequeueRequest() override { - if (heap_size == 0) - return {nullptr, false}; - - // Recursively pull request from child - auto [request, child_active] = items.front().child->dequeueRequest(); - assert(request != nullptr); - std::pop_heap(items.begin(), items.begin() + heap_size); - Item & current = items[heap_size - 1]; - - // SFQ fairness invariant: system vruntime equals last served request start-time - assert(current.vruntime >= system_vruntime); - system_vruntime = current.vruntime; - - // By definition vruntime is amount of consumed resource (cost) divided by weight - current.vruntime += double(request->cost) / current.child->info.weight; - max_vruntime = std::max(max_vruntime, current.vruntime); - - if (child_active) // Put active child back in heap after vruntime update + // Cycle is required to do deactivations in the case of canceled requests, when dequeueRequest returns `nullptr` + while (true) { - std::push_heap(items.begin(), items.begin() + heap_size); - } - else // Deactivate child if it is empty, but remember it's vruntime for latter activations - { - heap_size--; + if (heap_size == 0) + return {nullptr, false}; - // Store index of this inactive child in `parent.idx` - // This enables O(1) search of inactive children instead of O(n) - current.child->info.parent.idx = heap_size; - } + // Recursively pull request from child + auto [request, child_active] = items.front().child->dequeueRequest(); + std::pop_heap(items.begin(), items.begin() + heap_size); + Item & current = items[heap_size - 1]; - // Reset any difference between children on busy period end - if (heap_size == 0) - { - // Reset vtime to zero to avoid floating-point error accumulation, - // but do not reset too often, because it's O(N) - UInt64 ns = clock_gettime_ns(); - if (last_reset_ns + 1000000000 < ns) + if (request) { - last_reset_ns = ns; - for (Item & item : items) - item.vruntime = 0; - max_vruntime = 0; - } - system_vruntime = max_vruntime; - busy_periods++; - } + // SFQ fairness invariant: system vruntime equals last served request start-time + assert(current.vruntime >= system_vruntime); + system_vruntime = current.vruntime; - dequeued_requests++; - dequeued_cost += request->cost; - return {request, heap_size > 0}; + // By definition vruntime is amount of consumed resource (cost) divided by weight + current.vruntime += double(request->cost) / current.child->info.weight; + max_vruntime = std::max(max_vruntime, current.vruntime); + } + + if (child_active) // Put active child back in heap after vruntime update + { + std::push_heap(items.begin(), items.begin() + heap_size); + } + else // Deactivate child if it is empty, but remember it's vruntime for latter activations + { + heap_size--; + + // Store index of this inactive child in `parent.idx` + // This enables O(1) search of inactive children instead of O(n) + current.child->info.parent.idx = heap_size; + } + + // Reset any difference between children on busy period end + if (heap_size == 0) + { + // Reset vtime to zero to avoid floating-point error accumulation, + // but do not reset too often, because it's O(N) + UInt64 ns = clock_gettime_ns(); + if (last_reset_ns + 1000000000 < 
ns) + { + last_reset_ns = ns; + for (Item & item : items) + item.vruntime = 0; + max_vruntime = 0; + } + system_vruntime = max_vruntime; + busy_periods++; + } + + if (request) + { + dequeued_requests++; + dequeued_cost += request->cost; + return {request, heap_size > 0}; + } + } } bool isActive() override diff --git a/src/Common/Scheduler/Nodes/FifoQueue.h b/src/Common/Scheduler/Nodes/FifoQueue.h index 38ae902bc2f..45ed32343ff 100644 --- a/src/Common/Scheduler/Nodes/FifoQueue.h +++ b/src/Common/Scheduler/Nodes/FifoQueue.h @@ -39,8 +39,7 @@ public: void enqueueRequest(ResourceRequest * request) override { - std::unique_lock lock(mutex); - request->enqueue_ns = clock_gettime_ns(); + std::lock_guard lock(mutex); queue_cost += request->cost; bool was_empty = requests.empty(); requests.push_back(request); @@ -50,7 +49,7 @@ public: std::pair dequeueRequest() override { - std::unique_lock lock(mutex); + std::lock_guard lock(mutex); if (requests.empty()) return {nullptr, false}; ResourceRequest * result = requests.front(); @@ -63,9 +62,29 @@ public: return {result, !requests.empty()}; } + bool cancelRequest(ResourceRequest * request) override + { + std::lock_guard lock(mutex); + // TODO(serxa): reimplement queue as intrusive list of ResourceRequest to make this O(1) instead of O(N) + for (auto i = requests.begin(), e = requests.end(); i != e; ++i) + { + if (*i == request) + { + requests.erase(i); + if (requests.empty()) + busy_periods++; + queue_cost -= request->cost; + canceled_requests++; + canceled_cost += request->cost; + return true; + } + } + return false; + } + bool isActive() override { - std::unique_lock lock(mutex); + std::lock_guard lock(mutex); return !requests.empty(); } @@ -98,14 +117,14 @@ public: std::pair getQueueLengthAndCost() { - std::unique_lock lock(mutex); + std::lock_guard lock(mutex); return {requests.size(), queue_cost}; } private: std::mutex mutex; Int64 queue_cost = 0; - std::deque requests; + std::deque requests; // TODO(serxa): reimplement it using intrusive list to avoid allocations/deallocations and O(N) during cancel }; } diff --git a/src/Common/Scheduler/Nodes/PriorityPolicy.h b/src/Common/Scheduler/Nodes/PriorityPolicy.h index 6d6b15bd063..9b4cfc37f8c 100644 --- a/src/Common/Scheduler/Nodes/PriorityPolicy.h +++ b/src/Common/Scheduler/Nodes/PriorityPolicy.h @@ -102,25 +102,31 @@ public: std::pair dequeueRequest() override { - if (items.empty()) - return {nullptr, false}; - - // Recursively pull request from child - auto [request, child_active] = items.front().child->dequeueRequest(); - assert(request != nullptr); - - // Deactivate child if it is empty - if (!child_active) + // Cycle is required to do deactivations in the case of canceled requests, when dequeueRequest returns `nullptr` + while (true) { - std::pop_heap(items.begin(), items.end()); - items.pop_back(); if (items.empty()) - busy_periods++; - } + return {nullptr, false}; - dequeued_requests++; - dequeued_cost += request->cost; - return {request, !items.empty()}; + // Recursively pull request from child + auto [request, child_active] = items.front().child->dequeueRequest(); + + // Deactivate child if it is empty + if (!child_active) + { + std::pop_heap(items.begin(), items.end()); + items.pop_back(); + if (items.empty()) + busy_periods++; + } + + if (request) + { + dequeued_requests++; + dequeued_cost += request->cost; + return {request, !items.empty()}; + } + } } bool isActive() override diff --git a/src/Common/Scheduler/Nodes/tests/gtest_dynamic_resource_manager.cpp 
b/src/Common/Scheduler/Nodes/tests/gtest_dynamic_resource_manager.cpp index 961a3b6f713..cdf09776077 100644 --- a/src/Common/Scheduler/Nodes/tests/gtest_dynamic_resource_manager.cpp +++ b/src/Common/Scheduler/Nodes/tests/gtest_dynamic_resource_manager.cpp @@ -38,7 +38,6 @@ TEST(SchedulerDynamicResourceManager, Smoke) { ResourceGuard gA(cA->get("res1"), ResourceGuard::PostponeLocking); gA.lock(); - gA.setFailure(); gA.unlock(); ResourceGuard gB(cB->get("res1")); diff --git a/src/Common/Scheduler/Nodes/tests/gtest_resource_scheduler.cpp b/src/Common/Scheduler/Nodes/tests/gtest_resource_scheduler.cpp index 9fefbc02cbd..e76639a4b01 100644 --- a/src/Common/Scheduler/Nodes/tests/gtest_resource_scheduler.cpp +++ b/src/Common/Scheduler/Nodes/tests/gtest_resource_scheduler.cpp @@ -4,6 +4,7 @@ #include +#include #include using namespace DB; @@ -73,6 +74,22 @@ struct ResourceHolder } }; +struct MyRequest : public ResourceRequest +{ + std::function on_execute; + + explicit MyRequest(ResourceCost cost_, std::function on_execute_) + : ResourceRequest(cost_) + , on_execute(on_execute_) + {} + + void execute() override + { + if (on_execute) + on_execute(); + } +}; + TEST(SchedulerRoot, Smoke) { ResourceTest t; @@ -111,3 +128,49 @@ TEST(SchedulerRoot, Smoke) EXPECT_TRUE(fc2->requests.contains(&rg.request)); } } + +TEST(SchedulerRoot, Cancel) +{ + ResourceTest t; + + ResourceHolder r1(t); + auto * fc1 = r1.add("/", "1"); + r1.add("/prio"); + auto a = r1.addQueue("/prio/A", "1"); + auto b = r1.addQueue("/prio/B", "2"); + r1.registerResource(); + + std::barrier sync(2); + std::thread consumer1([&] + { + std::barrier destruct_sync(2); + MyRequest request(1,[&] + { + sync.arrive_and_wait(); // (A) + EXPECT_TRUE(fc1->requests.contains(&request)); + sync.arrive_and_wait(); // (B) + request.finish(); + destruct_sync.arrive_and_wait(); // (C) + }); + a.queue->enqueueRequest(&request); + destruct_sync.arrive_and_wait(); // (C) + }); + + std::thread consumer2([&] + { + MyRequest request(1,[&] + { + FAIL() << "This request must be canceled, but instead executes"; + }); + sync.arrive_and_wait(); // (A) wait for request of consumer1 to be inside execute, so that constraint is in violated state and our request will not be executed immediately + b.queue->enqueueRequest(&request); + bool canceled = b.queue->cancelRequest(&request); + EXPECT_TRUE(canceled); + sync.arrive_and_wait(); // (B) release request of consumer1 to be finished + }); + + consumer1.join(); + consumer2.join(); + + EXPECT_TRUE(fc1->requests.empty()); +} diff --git a/src/Common/Scheduler/ResourceGuard.h b/src/Common/Scheduler/ResourceGuard.h index dca4041b176..50f665a384b 100644 --- a/src/Common/Scheduler/ResourceGuard.h +++ b/src/Common/Scheduler/ResourceGuard.h @@ -71,8 +71,7 @@ public: // lock(mutex) is not required because `Dequeued` request cannot be used by the scheduler thread chassert(state == Dequeued); state = Finished; - if (constraint) - constraint->finishRequest(this); + ResourceRequest::finish(); } static Request & local() @@ -126,12 +125,6 @@ public: } } - /// Mark request as unsuccessful; by default request is considered to be successful - void setFailure() - { - request.successful = false; - } - ResourceLink link; Request & request; }; diff --git a/src/Common/Scheduler/ResourceRequest.cpp b/src/Common/Scheduler/ResourceRequest.cpp new file mode 100644 index 00000000000..26e8084cdfa --- /dev/null +++ b/src/Common/Scheduler/ResourceRequest.cpp @@ -0,0 +1,13 @@ +#include +#include + +namespace DB +{ + +void ResourceRequest::finish() +{ + if 
(constraint) + constraint->finishRequest(this); +} + +} diff --git a/src/Common/Scheduler/ResourceRequest.h b/src/Common/Scheduler/ResourceRequest.h index 3d2230746f9..f3153ad382c 100644 --- a/src/Common/Scheduler/ResourceRequest.h +++ b/src/Common/Scheduler/ResourceRequest.h @@ -14,9 +14,6 @@ class ISchedulerConstraint; using ResourceCost = Int64; constexpr ResourceCost ResourceCostMax = std::numeric_limits::max(); -/// Timestamps (nanoseconds since epoch) -using ResourceNs = UInt64; - /* * Request for a resource consumption. The main moving part of the scheduling subsystem. * Resource requests processing workflow: @@ -31,7 +28,7 @@ using ResourceNs = UInt64; * 3) Scheduler calls ISchedulerNode::dequeueRequest() that returns the request. * 4) Callback ResourceRequest::execute() is called to provide access to the resource. * 5) The resource consumption is happening outside of the scheduling subsystem. - * 6) request->constraint->finishRequest() is called when consumption is finished. + * 6) ResourceRequest::finish() is called when consumption is finished. * * Steps (5) and (6) can be omitted if constraint is not used by the resource. * @@ -39,7 +36,10 @@ using ResourceNs = UInt64; * Request ownership is done outside of the scheduling subsystem. * After (6) request can be destructed safely. * - * Request cancelling is not supported yet. + * Request can also be canceled before (3) using ISchedulerQueue::cancelRequest(). + * Returning false means it is too late for request to be canceled. It should be processed in a regular way. + * Returning true means successful cancel and therefore steps (4) and (5) are not going to happen + * and step (6) MUST be omitted. */ class ResourceRequest { @@ -48,32 +48,20 @@ public: /// NOTE: If cost is not known in advance, ResourceBudget should be used (note that every ISchedulerQueue has it) ResourceCost cost; - /// Request outcome - /// Should be filled during resource consumption - bool successful; - /// Scheduler node to be notified on consumption finish /// Auto-filled during request enqueue/dequeue ISchedulerConstraint * constraint; - /// Timestamps for introspection - ResourceNs enqueue_ns; - ResourceNs execute_ns; - ResourceNs finish_ns; - explicit ResourceRequest(ResourceCost cost_ = 1) { reset(cost_); } + /// ResourceRequest object may be reused again after reset() void reset(ResourceCost cost_) { cost = cost_; - successful = true; constraint = nullptr; - enqueue_ns = 0; - execute_ns = 0; - finish_ns = 0; } virtual ~ResourceRequest() = default; @@ -83,6 +71,12 @@ public: /// just triggering start of a consumption, not doing the consumption itself /// (e.g. setting an std::promise or creating a job in a thread pool) virtual void execute() = 0; + + /// Stop resource consumption and notify resource scheduler. + /// Should be called when resource consumption is finished by consumer. + /// ResourceRequest should not be destructed or reset before calling to `finish()`. + /// WARNING: this function MUST not be called if request was canceled. 
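A consumer-side sketch of the lifecycle described in the comments above, assuming an `ISchedulerQueue` obtained from the resource scheduler (the new `SchedulerRoot.Cancel` unit test in this patch exercises the same pattern in full). This is an illustration, not code from the patch.

```cpp
#include <Common/Scheduler/ISchedulerQueue.h>
#include <Common/Scheduler/ResourceRequest.h>

struct MyRequest : DB::ResourceRequest
{
    using DB::ResourceRequest::ResourceRequest;

    void execute() override
    {
        // (4) Access granted: trigger the actual consumption, e.g. fulfil a promise
        // or start a job in a thread pool.
    }
};

void consume(DB::ISchedulerQueue & queue)
{
    MyRequest request(/* cost = */ 1);
    queue.enqueueRequest(&request);      // (2) hand the request over to the scheduler

    if (queue.cancelRequest(&request))   // optional: try to cancel before it is executed
        return;                          // canceled: (4)-(6) will not happen and finish() must not be called

    // ... wait until execute() has been called and the consumption (5) is over ...
    request.finish();                    // (6) notify constraints that the resource is released
}
```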
+ void finish(); }; } diff --git a/src/Common/Scheduler/SchedulerRoot.h b/src/Common/Scheduler/SchedulerRoot.h index 3a23a8df834..ab3f702a422 100644 --- a/src/Common/Scheduler/SchedulerRoot.h +++ b/src/Common/Scheduler/SchedulerRoot.h @@ -145,22 +145,27 @@ public: std::pair dequeueRequest() override { - if (current == nullptr) // No active resources - return {nullptr, false}; + while (true) + { + if (current == nullptr) // No active resources + return {nullptr, false}; - // Dequeue request from current resource - auto [request, resource_active] = current->root->dequeueRequest(); - assert(request != nullptr); + // Dequeue request from current resource + auto [request, resource_active] = current->root->dequeueRequest(); - // Deactivate resource if required - if (!resource_active) - deactivate(current); - else - current = current->next; // Just move round-robin pointer + // Deactivate resource if required + if (!resource_active) + deactivate(current); + else + current = current->next; // Just move round-robin pointer - dequeued_requests++; - dequeued_cost += request->cost; - return {request, current != nullptr}; + if (request == nullptr) // Possible in case of request cancel, just retry + continue; + + dequeued_requests++; + dequeued_cost += request->cost; + return {request, current != nullptr}; + } } bool isActive() override @@ -245,7 +250,6 @@ private: void execute(ResourceRequest * request) { - request->execute_ns = clock_gettime_ns(); request->execute(); } diff --git a/src/Storages/System/StorageSystemScheduler.cpp b/src/Storages/System/StorageSystemScheduler.cpp index ba07d44dbf9..633bac5d285 100644 --- a/src/Storages/System/StorageSystemScheduler.cpp +++ b/src/Storages/System/StorageSystemScheduler.cpp @@ -30,7 +30,9 @@ ColumnsDescription StorageSystemScheduler::getColumnsDescription() {"is_active", std::make_shared(), "Whether this node is currently active - has resource requests to be dequeued and constraints satisfied."}, {"active_children", std::make_shared(), "The number of children in active state."}, {"dequeued_requests", std::make_shared(), "The total number of resource requests dequeued from this node."}, + {"canceled_requests", std::make_shared(), "The total number of resource requests canceled from this node."}, {"dequeued_cost", std::make_shared(), "The sum of costs (e.g. size in bytes) of all requests dequeued from this node."}, + {"canceled_cost", std::make_shared(), "The sum of costs (e.g. size in bytes) of all requests canceled from this node."}, {"busy_periods", std::make_shared(), "The total number of deactivations of this node."}, {"vruntime", std::make_shared(std::make_shared()), "For children of `fair` nodes only. 
Virtual runtime of a node used by SFQ algorithm to select the next child to process in a max-min fair manner."}, @@ -93,7 +95,9 @@ void StorageSystemScheduler::fillData(MutableColumns & res_columns, ContextPtr c res_columns[i++]->insert(node->isActive()); res_columns[i++]->insert(node->activeChildren()); res_columns[i++]->insert(node->dequeued_requests.load()); + res_columns[i++]->insert(node->canceled_requests.load()); res_columns[i++]->insert(node->dequeued_cost.load()); + res_columns[i++]->insert(node->canceled_cost.load()); res_columns[i++]->insert(node->busy_periods.load()); Field vruntime; From 8b1a1d42daa01e946aa8102d683dbab90b447838 Mon Sep 17 00:00:00 2001 From: Aleksei Filatov Date: Thu, 29 Feb 2024 18:07:00 +0300 Subject: [PATCH 083/985] Traverse shadow directory for system.remote_data_paths --- src/Core/Settings.h | 1 + src/Disks/IDisk.h | 5 ++++- src/Disks/ObjectStorages/DiskObjectStorage.cpp | 10 ++++++++-- src/Disks/ObjectStorages/DiskObjectStorage.h | 5 ++++- .../System/StorageSystemRemoteDataPaths.cpp | 13 +++++++++++++ 5 files changed, 30 insertions(+), 4 deletions(-) diff --git a/src/Core/Settings.h b/src/Core/Settings.h index d77b3a45188..7cf068d7f1f 100644 --- a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -843,6 +843,7 @@ class IColumn; M(Bool, optimize_uniq_to_count, true, "Rewrite uniq and its variants(except uniqUpTo) to count if subquery has distinct or group by clause.", 0) \ M(Bool, use_variant_as_common_type, false, "Use Variant as a result type for if/multiIf in case when there is no common type for arguments", 0) \ M(Bool, enable_order_by_all, true, "Enable sorting expression ORDER BY ALL.", 0) \ + M(Bool, traverse_shadow_remote_data_paths, false, "Traverse shadow directory when query system.remote_data_paths", 0) \ \ /** Experimental functions */ \ M(Bool, allow_experimental_materialized_postgresql_table, false, "Allows to use the MaterializedPostgreSQL table engine. Disabled by default, because this feature is experimental", 0) \ diff --git a/src/Disks/IDisk.h b/src/Disks/IDisk.h index 3d228850537..62b02938d1a 100644 --- a/src/Disks/IDisk.h +++ b/src/Disks/IDisk.h @@ -320,7 +320,10 @@ public: {} }; - virtual void getRemotePathsRecursive(const String &, std::vector &) + virtual void getRemotePathsRecursive( + const String &, + std::vector &, + const std::function & /* skip_predicate */ = {}) { throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method `getRemotePathsRecursive() not implemented for disk: {}`", diff --git a/src/Disks/ObjectStorages/DiskObjectStorage.cpp b/src/Disks/ObjectStorages/DiskObjectStorage.cpp index 2a648f28f14..460d242d5cd 100644 --- a/src/Disks/ObjectStorages/DiskObjectStorage.cpp +++ b/src/Disks/ObjectStorages/DiskObjectStorage.cpp @@ -90,11 +90,17 @@ StoredObjects DiskObjectStorage::getStorageObjects(const String & local_path) co return metadata_storage->getStorageObjects(local_path); } -void DiskObjectStorage::getRemotePathsRecursive(const String & local_path, std::vector & paths_map) +void DiskObjectStorage::getRemotePathsRecursive( + const String & local_path, + std::vector & paths_map, + const std::function & skip_predicate) { if (!metadata_storage->exists(local_path)) return; + if (skip_predicate && skip_predicate(local_path)) + return; + /// Protect against concurrent delition of files (for example because of a merge). 
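For illustration only: the new `skip_predicate` argument receives each local path before it is processed, and returning `true` skips that path entirely (for a directory this prunes the whole subtree, since the check happens before recursion). A simplified caller might look like the sketch below; the predicate actually added later in this patch is stricter and filters only `shadow/<backup_name>/revision.txt`.

```cpp
#include <Disks/IDisk.h>
#include <filesystem>
#include <string>

// PathsVector stands in for the vector of local/remote path entries that
// getRemotePathsRecursive fills in (its element type is unchanged by this patch).
template <typename PathsVector>
void collectShadowPaths(DB::IDisk & disk, PathsVector & paths_map)
{
    disk.getRemotePathsRecursive(
        "shadow",
        paths_map,
        [](const std::string & local_path)
        {
            // Skip bookkeeping files that carry no object storage metadata.
            return std::filesystem::path(local_path).filename() == "revision.txt";
        });
}
```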
if (metadata_storage->isFile(local_path)) { @@ -142,7 +148,7 @@ void DiskObjectStorage::getRemotePathsRecursive(const String & local_path, std:: } for (; it->isValid(); it->next()) - DiskObjectStorage::getRemotePathsRecursive(fs::path(local_path) / it->name(), paths_map); + DiskObjectStorage::getRemotePathsRecursive(fs::path(local_path) / it->name(), paths_map, skip_predicate); } } diff --git a/src/Disks/ObjectStorages/DiskObjectStorage.h b/src/Disks/ObjectStorages/DiskObjectStorage.h index e1576509713..d7af656bea3 100644 --- a/src/Disks/ObjectStorages/DiskObjectStorage.h +++ b/src/Disks/ObjectStorages/DiskObjectStorage.h @@ -48,7 +48,10 @@ public: StoredObjects getStorageObjects(const String & local_path) const override; - void getRemotePathsRecursive(const String & local_path, std::vector & paths_map) override; + void getRemotePathsRecursive( + const String & local_path, + std::vector & paths_map, + const std::function & skip_predicate = {}) override; const std::string & getCacheName() const override { return object_storage->getCacheName(); } diff --git a/src/Storages/System/StorageSystemRemoteDataPaths.cpp b/src/Storages/System/StorageSystemRemoteDataPaths.cpp index 87b7a84e8ba..708c1369965 100644 --- a/src/Storages/System/StorageSystemRemoteDataPaths.cpp +++ b/src/Storages/System/StorageSystemRemoteDataPaths.cpp @@ -9,6 +9,7 @@ #include #include +namespace fs = std::filesystem; namespace DB { @@ -59,6 +60,18 @@ Pipe StorageSystemRemoteDataPaths::read( std::vector remote_paths_by_local_path; disk->getRemotePathsRecursive("store", remote_paths_by_local_path); disk->getRemotePathsRecursive("data", remote_paths_by_local_path); + if (context->getSettingsRef().traverse_shadow_remote_data_paths) + disk->getRemotePathsRecursive( + "shadow", + remote_paths_by_local_path, + [](const String & local_path) + { + // `shadow/{backup_name}/revision.txt` is not an object metadata file + const auto path = fs::path(local_path); + return path.filename() == "revision.txt" && + path.parent_path().has_parent_path() && + path.parent_path().parent_path().filename() == "shadow"; + }); FileCachePtr cache; From 5641fd8ba9c4f27794367e22632365df5cdf0303 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Thu, 29 Feb 2024 16:13:05 +0100 Subject: [PATCH 084/985] Fix build after merge --- src/IO/WriteBufferFromS3TaskTracker.h | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/IO/WriteBufferFromS3TaskTracker.h b/src/IO/WriteBufferFromS3TaskTracker.h index 134abbbc4c1..4061f084a76 100644 --- a/src/IO/WriteBufferFromS3TaskTracker.h +++ b/src/IO/WriteBufferFromS3TaskTracker.h @@ -1,7 +1,7 @@ #pragma once #include "config.h" -#include +#include #include "WriteBufferFromS3.h" #include From 7632c2c33f357c1c616f734c7bf2502ccbfbd496 Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 29 Feb 2024 15:17:12 +0000 Subject: [PATCH 085/985] Remove non-deterministic functions in virtual columns filter --- src/Storages/MergeTree/MergeTreeData.cpp | 2 ++ src/Storages/VirtualColumnUtils.cpp | 21 +++++++++++++++++++ ...with_non_deterministic_functions.reference | 11 ++++++++++ ...lumns_with_non_deterministic_functions.sql | 6 ++++++ 4 files changed, 40 insertions(+) create mode 100644 tests/queries/0_stateless/03002_filter_skip_virtual_columns_with_non_deterministic_functions.reference create mode 100644 tests/queries/0_stateless/03002_filter_skip_virtual_columns_with_non_deterministic_functions.sql diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index 
8aa188cfe5c..6494ed5d844 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -1082,6 +1082,8 @@ std::optional MergeTreeData::totalRowsByPartitionPredicateImpl( Block virtual_columns_block = getBlockWithVirtualPartColumns(parts, true /* one_part */); auto filter_dag = VirtualColumnUtils::splitFilterDagForAllowedInputs(filter_actions_dag->getOutputs().at(0), nullptr); + if (!filter_dag) + return {}; // Generate valid expressions for filtering bool valid = true; diff --git a/src/Storages/VirtualColumnUtils.cpp b/src/Storages/VirtualColumnUtils.cpp index 33ff6e7104f..3e0ef1d7990 100644 --- a/src/Storages/VirtualColumnUtils.cpp +++ b/src/Storages/VirtualColumnUtils.cpp @@ -467,6 +467,23 @@ static bool canEvaluateSubtree(const ActionsDAG::Node * node, const Block & allo return true; } +static bool isDeterministic(const ActionsDAG::Node * node) +{ + if (node->type != ActionsDAG::ActionType::FUNCTION) + return true; + + if (!node->function_base->isDeterministic()) + return false; + + for (const auto * child : node->children) + { + if (!isDeterministic(child)) + return false; + } + + return true; +} + static const ActionsDAG::Node * splitFilterNodeForAllowedInputs( const ActionsDAG::Node * node, const Block * allowed_inputs, @@ -542,6 +559,10 @@ static const ActionsDAG::Node * splitFilterNodeForAllowedInputs( } } } + else if (!isDeterministic(node)) + { + return nullptr; + } } if (allowed_inputs && !canEvaluateSubtree(node, *allowed_inputs)) diff --git a/tests/queries/0_stateless/03002_filter_skip_virtual_columns_with_non_deterministic_functions.reference b/tests/queries/0_stateless/03002_filter_skip_virtual_columns_with_non_deterministic_functions.reference new file mode 100644 index 00000000000..4c9646d6ffa --- /dev/null +++ b/tests/queries/0_stateless/03002_filter_skip_virtual_columns_with_non_deterministic_functions.reference @@ -0,0 +1,11 @@ +0 +0 +0 +0 +0 +0 +0 +0 +0 +0 +1 diff --git a/tests/queries/0_stateless/03002_filter_skip_virtual_columns_with_non_deterministic_functions.sql b/tests/queries/0_stateless/03002_filter_skip_virtual_columns_with_non_deterministic_functions.sql new file mode 100644 index 00000000000..9f8bc6bd3d7 --- /dev/null +++ b/tests/queries/0_stateless/03002_filter_skip_virtual_columns_with_non_deterministic_functions.sql @@ -0,0 +1,6 @@ +create table test (number UInt64) engine=MergeTree order by number; +insert into test select * from numbers(100000000); +select ignore(number) from test where RAND() > 4292390314 limit 10; +select count() > 0 from test where RAND() > 4292390314; +drop table test; + From 09a392772d75b38e1b19ad6bd2a863168ea0de5c Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 29 Feb 2024 15:34:45 +0000 Subject: [PATCH 086/985] Use isDeterministicInScopeOfQuery --- src/Storages/VirtualColumnUtils.cpp | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/src/Storages/VirtualColumnUtils.cpp b/src/Storages/VirtualColumnUtils.cpp index 3e0ef1d7990..6d66453442e 100644 --- a/src/Storages/VirtualColumnUtils.cpp +++ b/src/Storages/VirtualColumnUtils.cpp @@ -467,17 +467,17 @@ static bool canEvaluateSubtree(const ActionsDAG::Node * node, const Block & allo return true; } -static bool isDeterministic(const ActionsDAG::Node * node) +static bool isDeterministicInScopeOfQuery(const ActionsDAG::Node * node) { if (node->type != ActionsDAG::ActionType::FUNCTION) return true; - if (!node->function_base->isDeterministic()) + if (!node->function_base->isDeterministicInScopeOfQuery()) return false; for 
(const auto * child : node->children) { - if (!isDeterministic(child)) + if (!isDeterministicInScopeOfQuery(child)) return false; } @@ -559,7 +559,7 @@ static const ActionsDAG::Node * splitFilterNodeForAllowedInputs( } } } - else if (!isDeterministic(node)) + else if (!isDeterministicInScopeOfQuery(node)) { return nullptr; } From 55053dae4459b1d1a6c05d436d1ab421a96c3934 Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Thu, 29 Feb 2024 19:18:06 +0100 Subject: [PATCH 087/985] Some progress --- src/Analyzer/IdentifierNode.cpp | 10 +--- src/Analyzer/IdentifierNode.h | 6 --- src/DataTypes/ObjectUtils.cpp | 24 +++++----- src/DataTypes/ObjectUtils.h | 4 +- .../ClusterProxy/SelectStreamFactory.cpp | 10 ++-- .../ClusterProxy/SelectStreamFactory.h | 8 +++- src/Processors/QueryPlan/ReadFromRemote.cpp | 47 +++++++++++++++++++ .../test_distributed_type_object/test.py | 2 +- 8 files changed, 80 insertions(+), 31 deletions(-) diff --git a/src/Analyzer/IdentifierNode.cpp b/src/Analyzer/IdentifierNode.cpp index 7e4d4c02a4c..88b3daacb12 100644 --- a/src/Analyzer/IdentifierNode.cpp +++ b/src/Analyzer/IdentifierNode.cpp @@ -1,4 +1,3 @@ -#include #include #include @@ -57,18 +56,13 @@ void IdentifierNode::updateTreeHashImpl(HashState & state) const QueryTreeNodePtr IdentifierNode::cloneImpl() const { - auto result = std::make_shared(identifier); - result->use_parts_for_to_ast = use_parts_for_to_ast; - return result; + return std::make_shared(identifier); } ASTPtr IdentifierNode::toASTImpl(const ConvertToASTOptions & /* options */) const { auto identifier_parts = identifier.getParts(); - if (use_parts_for_to_ast) - return std::make_shared(std::move(identifier_parts)); - else - return std::make_shared(identifier.getFullName()); + return std::make_shared(std::move(identifier_parts)); } } diff --git a/src/Analyzer/IdentifierNode.h b/src/Analyzer/IdentifierNode.h index 3bc37b4c69d..872bb14d512 100644 --- a/src/Analyzer/IdentifierNode.h +++ b/src/Analyzer/IdentifierNode.h @@ -52,11 +52,6 @@ public: void dumpTreeImpl(WriteBuffer & buffer, FormatState & format_state, size_t indent) const override; - void useFullNameInToAST() - { - use_parts_for_to_ast = false; - } - protected: bool isEqualImpl(const IQueryTreeNode & rhs) const override; @@ -69,7 +64,6 @@ protected: private: Identifier identifier; std::optional table_expression_modifiers; - bool use_parts_for_to_ast = false; static constexpr size_t children_size = 0; }; diff --git a/src/DataTypes/ObjectUtils.cpp b/src/DataTypes/ObjectUtils.cpp index 01ba50d90f3..47d8c5c9113 100644 --- a/src/DataTypes/ObjectUtils.cpp +++ b/src/DataTypes/ObjectUtils.cpp @@ -965,30 +965,32 @@ void replaceMissedSubcolumnsByConstants( /// @expected_columns and @available_columns contain descriptions /// of extended Object columns. 
-void replaceMissedSubcolumnsByConstants( +MissingObjectList replaceMissedSubcolumnsByConstants( const ColumnsDescription & expected_columns, const ColumnsDescription & available_columns, QueryTreeNodePtr & query, const ContextPtr & context [[maybe_unused]]) { + MissingObjectList missed_list; + NamesAndTypes missed_names_types = calculateMissedSubcolumns(expected_columns, available_columns); if (missed_names_types.empty()) - return; + return missed_list; auto * query_node = query->as(); if (!query_node) - return; + return missed_list; + + missed_list.reserve(missed_names_types.size()); auto table_expression = extractLeftTableExpression(query_node->getJoinTree()); - auto & with_nodes = query_node->getWith().getNodes(); - std::unordered_map column_name_to_node; for (const auto & [name, type] : missed_names_types) { auto constant = std::make_shared(type->getDefault(), type); - constant->setAlias(table_expression->getAlias() + name); + constant->setAlias(table_expression->getAlias() + "." + name); // auto materialize = std::make_shared("materialize"); // auto function = FunctionFactory::instance().get("materialize", context); @@ -996,17 +998,17 @@ void replaceMissedSubcolumnsByConstants( // materialize->resolveAsFunction(function->build(materialize->getArgumentColumns())); // materialize->setAlias(name); - with_nodes.push_back(constant); - - auto id = std::make_shared(Identifier(table_expression->getAlias() + name)); - id->useFullNameInToAST(); - column_name_to_node[name] = id; + column_name_to_node[name] = buildCastFunction(constant, type, context); + missed_list.push_back({ constant->getValueStringRepresentation() + "_" + constant->getResultType()->getName(), table_expression->getAlias() + "." + name }); + LOG_DEBUG(&Poco::Logger::get("replaceMissedSubcolumnsByConstants"), "{} -> {}", missed_list.back().first, missed_list.back().second); LOG_DEBUG(&Poco::Logger::get("replaceMissedSubcolumnsByConstants"), "Name {} Expression\n{}", name, column_name_to_node[name]->dumpTree()); } LOG_DEBUG(&Poco::Logger::get("replaceMissedSubcolumnsByConstants"), "Table expression\n{} ", table_expression->dumpTree()); replaceColumns(query, table_expression, column_name_to_node); LOG_DEBUG(&Poco::Logger::get("replaceMissedSubcolumnsByConstants"), "Result:\n{} ", query->dumpTree()); + + return missed_list; } Field FieldVisitorReplaceScalars::operator()(const Array & x) const diff --git a/src/DataTypes/ObjectUtils.h b/src/DataTypes/ObjectUtils.h index f4a8abe8abf..013e525832e 100644 --- a/src/DataTypes/ObjectUtils.h +++ b/src/DataTypes/ObjectUtils.h @@ -102,7 +102,9 @@ void replaceMissedSubcolumnsByConstants( const ColumnsDescription & available_columns, ASTPtr query); -void replaceMissedSubcolumnsByConstants( +using MissingObjectList = std::vector>; + +MissingObjectList replaceMissedSubcolumnsByConstants( const ColumnsDescription & expected_columns, const ColumnsDescription & available_columns, QueryTreeNodePtr & query, diff --git a/src/Interpreters/ClusterProxy/SelectStreamFactory.cpp b/src/Interpreters/ClusterProxy/SelectStreamFactory.cpp index 5167ffc0e27..5bcd1ce68cb 100644 --- a/src/Interpreters/ClusterProxy/SelectStreamFactory.cpp +++ b/src/Interpreters/ClusterProxy/SelectStreamFactory.cpp @@ -151,7 +151,8 @@ void SelectStreamFactory::createForShardImpl( Shards & remote_shards, UInt32 shard_count, bool parallel_replicas_enabled, - AdditionalShardFilterGenerator shard_filter_generator) + AdditionalShardFilterGenerator shard_filter_generator, + MissingObjectList missed_list) { auto emplace_local_stream = 
[&]() { @@ -177,6 +178,7 @@ void SelectStreamFactory::createForShardImpl( .query = query_ast, .main_table = main_table, .header = shard_header, + .missing_object_list = std::move(missed_list), .shard_info = shard_info, .lazy = lazy, .local_delay = local_delay, @@ -299,8 +301,9 @@ void SelectStreamFactory::createForShard( auto it = objects_by_shard.find(shard_info.shard_num); QueryTreeNodePtr modified_query = query_tree; + MissingObjectList missed_list; if (it != objects_by_shard.end()) - replaceMissedSubcolumnsByConstants(storage_snapshot->object_columns, it->second, modified_query, context); + missed_list = replaceMissedSubcolumnsByConstants(storage_snapshot->object_columns, it->second, modified_query, context); auto query_ast = queryNodeToDistributedSelectQuery(modified_query); @@ -314,7 +317,8 @@ void SelectStreamFactory::createForShard( remote_shards, shard_count, parallel_replicas_enabled, - std::move(shard_filter_generator)); + std::move(shard_filter_generator), + std::move(missed_list)); } diff --git a/src/Interpreters/ClusterProxy/SelectStreamFactory.h b/src/Interpreters/ClusterProxy/SelectStreamFactory.h index 45d6ea14c01..bee7edb3c19 100644 --- a/src/Interpreters/ClusterProxy/SelectStreamFactory.h +++ b/src/Interpreters/ClusterProxy/SelectStreamFactory.h @@ -1,5 +1,6 @@ #pragma once +#include #include #include #include @@ -43,6 +44,8 @@ ASTPtr rewriteSelectQuery( using ColumnsDescriptionByShardNum = std::unordered_map; using AdditionalShardFilterGenerator = std::function; +using MissingObjectList = std::vector>; + class SelectStreamFactory { public: @@ -55,6 +58,8 @@ public: StorageID main_table; Block header; + MissingObjectList missing_object_list; + Cluster::ShardInfo shard_info; /// If we connect to replicas lazily. @@ -112,7 +117,8 @@ private: Shards & remote_shards, UInt32 shard_count, bool parallel_replicas_enabled, - AdditionalShardFilterGenerator shard_filter_generator); + AdditionalShardFilterGenerator shard_filter_generator, + MissingObjectList missed_list = {}); }; } diff --git a/src/Processors/QueryPlan/ReadFromRemote.cpp b/src/Processors/QueryPlan/ReadFromRemote.cpp index fde2313bc15..ac507c6d555 100644 --- a/src/Processors/QueryPlan/ReadFromRemote.cpp +++ b/src/Processors/QueryPlan/ReadFromRemote.cpp @@ -1,3 +1,4 @@ +#include #include #include @@ -14,6 +15,7 @@ #include #include #include +#include "DataTypes/ObjectUtils.h" #include #include #include @@ -31,6 +33,48 @@ namespace ErrorCodes extern const int LOGICAL_ERROR; } +static void addRenamingActions(Pipe & pipe, const MissingObjectList & missed_list, const Block & output_header) +{ + if (missed_list.empty()) + return; + + const auto & output_columns = output_header.getColumnsWithTypeAndName(); + std::vector indexes; + for (size_t i = 0; i < output_columns.size(); ++i) + { + bool found = false; + for (auto const & elem : missed_list) + { + if (output_columns[i].name.contains(elem.second)) + { + found = true; + break; + } + } + if (found) + indexes.push_back(i); + } + + auto dag = std::make_shared(pipe.getHeader().getColumnsWithTypeAndName()); + + for (size_t index : indexes) + { + dag->addOrReplaceInOutputs(dag->addAlias(*dag->getOutputs()[index], output_header.getByPosition(index).name)); + } + + // dag->addAliases(rename_to_apply); + + auto convert_actions = std::make_shared(dag); + pipe.addSimpleTransform([&](const Block & cur_header, Pipe::StreamType) -> ProcessorPtr + { + return std::make_shared(cur_header, convert_actions); + }); + + LOG_DEBUG(&Poco::Logger::get("addRenamingActions"), "EXPECTED:\n{}", 
output_header.dumpStructure()); + + LOG_DEBUG(&Poco::Logger::get("addRenamingActions"), "{}", pipe.getHeader().dumpStructure()); +} + static void addConvertingActions(Pipe & pipe, const Block & header) { if (blocksHaveEqualStructure(pipe.getHeader(), header)) @@ -216,6 +260,7 @@ void ReadFromRemote::addLazyPipe(Pipes & pipes, const ClusterProxy::SelectStream }; pipes.emplace_back(createDelayedPipe(shard.header, lazily_create_stream, add_totals, add_extremes)); + addRenamingActions(pipes.back(), shard.missing_object_list, output_stream->header); addConvertingActions(pipes.back(), output_stream->header); } @@ -297,6 +342,7 @@ void ReadFromRemote::addPipe(Pipes & pipes, const ClusterProxy::SelectStreamFact pipes.emplace_back( createRemoteSourcePipe(remote_query_executor, add_agg_info, add_totals, add_extremes, async_read, async_query_sending)); + addRenamingActions(pipes.back(), shard.missing_object_list, output_stream->header); addConvertingActions(pipes.back(), output_stream->header); } } @@ -326,6 +372,7 @@ void ReadFromRemote::addPipe(Pipes & pipes, const ClusterProxy::SelectStreamFact pipes.emplace_back( createRemoteSourcePipe(remote_query_executor, add_agg_info, add_totals, add_extremes, async_read, async_query_sending)); + addRenamingActions(pipes.back(), shard.missing_object_list, output_stream->header); addConvertingActions(pipes.back(), output_stream->header); } } diff --git a/tests/integration/test_distributed_type_object/test.py b/tests/integration/test_distributed_type_object/test.py index b2179af8a3f..f77e0248f02 100644 --- a/tests/integration/test_distributed_type_object/test.py +++ b/tests/integration/test_distributed_type_object/test.py @@ -59,7 +59,7 @@ def test_distributed_type_object(started_cluster): ) expected = TSV("120\n") - assert TSV(node1.query("SELECT sum(data.k2 * id) FROM dist_table")) == expected + assert TSV(node1.query("SELECT sum(data.k2 * id) FROM dist_table SETTINGS optimize_arithmetic_operations_in_aggregate_functions = 0")) == expected node1.query("TRUNCATE TABLE local_table") node2.query("TRUNCATE TABLE local_table") From 41deadda359ca02528fa6ffe9ecfed09c36b364a Mon Sep 17 00:00:00 2001 From: robot-clickhouse Date: Thu, 29 Feb 2024 18:37:00 +0000 Subject: [PATCH 088/985] Automatic style fix --- tests/integration/test_distributed_type_object/test.py | 9 ++++++++- 1 file changed, 8 insertions(+), 1 deletion(-) diff --git a/tests/integration/test_distributed_type_object/test.py b/tests/integration/test_distributed_type_object/test.py index f77e0248f02..7e6c000cb8e 100644 --- a/tests/integration/test_distributed_type_object/test.py +++ b/tests/integration/test_distributed_type_object/test.py @@ -59,7 +59,14 @@ def test_distributed_type_object(started_cluster): ) expected = TSV("120\n") - assert TSV(node1.query("SELECT sum(data.k2 * id) FROM dist_table SETTINGS optimize_arithmetic_operations_in_aggregate_functions = 0")) == expected + assert ( + TSV( + node1.query( + "SELECT sum(data.k2 * id) FROM dist_table SETTINGS optimize_arithmetic_operations_in_aggregate_functions = 0" + ) + ) + == expected + ) node1.query("TRUNCATE TABLE local_table") node2.query("TRUNCATE TABLE local_table") From a6cebad52bf4f29984db99cd4d4aa1eb41c50895 Mon Sep 17 00:00:00 2001 From: Nataly Merezhuk Date: Thu, 29 Feb 2024 16:32:29 -0500 Subject: [PATCH 089/985] Adds note on supported PostgreSQL versions. 
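Returning to the Object-columns handling added a few patches above: a hypothetical walk-through of what the new `MissingObjectList` carries. Assume a Distributed query over an `Object` column where one shard never received the subcolumn `data.k3 UInt8`. The rewritten shard query selects a typed default constant aliased with the table alias plus the subcolumn name, and the initiator keeps one pair per missing subcolumn so that `addRenamingActions` can alias the returned column back to the name expected by the output header. The concrete names below are illustrative, derived from how the pairs are built in `replaceMissedSubcolumnsByConstants`.

```cpp
#include <string>
#include <utility>
#include <vector>

using MissingObjectList = std::vector<std::pair<std::string, std::string>>;

// One entry per subcolumn that is absent on the shard:
//   first  - name the constant column gets in the shard result, "<value>_<type>"
//   second - alias used in the rewritten shard query, "<table alias>.<subcolumn>"
MissingObjectList missing_object_list = {
    {"0_UInt8", "t.data.k3"},
};
```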
--- docs/en/engines/table-engines/integrations/postgresql.md | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/docs/en/engines/table-engines/integrations/postgresql.md b/docs/en/engines/table-engines/integrations/postgresql.md index 131df1a435b..9cc4b11243e 100644 --- a/docs/en/engines/table-engines/integrations/postgresql.md +++ b/docs/en/engines/table-engines/integrations/postgresql.md @@ -8,6 +8,10 @@ sidebar_label: PostgreSQL The PostgreSQL engine allows to perform `SELECT` and `INSERT` queries on data that is stored on a remote PostgreSQL server. +:::note +Currently, only PostgreSQL versions 12 and up are supported. +::: + ## Creating a Table {#creating-a-table} ``` sql From 0f2d47e5a444bf78ffef6b2506e50079e6bb55c9 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Fri, 1 Mar 2024 10:52:44 +0100 Subject: [PATCH 090/985] Renamed WriteBufferFromS3TaskTracker to ThreadPoolTaskTracker --- .../ThreadPoolTaskTracker.cpp} | 2 +- .../ThreadPoolTaskTracker.h} | 6 +++--- src/Disks/IO/WriteBufferFromAzureBlobStorage.h | 2 +- src/IO/WriteBufferFromS3.cpp | 2 +- src/IO/WriteBufferFromS3.h | 2 +- 5 files changed, 7 insertions(+), 7 deletions(-) rename src/{IO/WriteBufferFromS3TaskTracker.cpp => Common/ThreadPoolTaskTracker.cpp} (99%) rename src/{IO/WriteBufferFromS3TaskTracker.h => Common/ThreadPoolTaskTracker.h} (94%) diff --git a/src/IO/WriteBufferFromS3TaskTracker.cpp b/src/Common/ThreadPoolTaskTracker.cpp similarity index 99% rename from src/IO/WriteBufferFromS3TaskTracker.cpp rename to src/Common/ThreadPoolTaskTracker.cpp index e62de261fc2..10207eb6296 100644 --- a/src/IO/WriteBufferFromS3TaskTracker.cpp +++ b/src/Common/ThreadPoolTaskTracker.cpp @@ -1,6 +1,6 @@ #include "config.h" -#include +#include "ThreadPoolTaskTracker.h" namespace ProfileEvents { diff --git a/src/IO/WriteBufferFromS3TaskTracker.h b/src/Common/ThreadPoolTaskTracker.h similarity index 94% rename from src/IO/WriteBufferFromS3TaskTracker.h rename to src/Common/ThreadPoolTaskTracker.h index 4061f084a76..d37b759a913 100644 --- a/src/IO/WriteBufferFromS3TaskTracker.h +++ b/src/Common/ThreadPoolTaskTracker.h @@ -1,10 +1,10 @@ #pragma once #include "config.h" -#include -#include "WriteBufferFromS3.h" +#include "threadPoolCallbackRunner.h" +#include "IO/WriteBufferFromS3.h" -#include +#include "logger_useful.h" #include diff --git a/src/Disks/IO/WriteBufferFromAzureBlobStorage.h b/src/Disks/IO/WriteBufferFromAzureBlobStorage.h index 2d11014fa2a..4897ca9a846 100644 --- a/src/Disks/IO/WriteBufferFromAzureBlobStorage.h +++ b/src/Disks/IO/WriteBufferFromAzureBlobStorage.h @@ -11,7 +11,7 @@ #include #include #include -#include +#include namespace Poco diff --git a/src/IO/WriteBufferFromS3.cpp b/src/IO/WriteBufferFromS3.cpp index 6fc0a35672f..510d9bef4d3 100644 --- a/src/IO/WriteBufferFromS3.cpp +++ b/src/IO/WriteBufferFromS3.cpp @@ -4,8 +4,8 @@ #include "StdIStreamFromMemory.h" #include "WriteBufferFromS3.h" -#include "WriteBufferFromS3TaskTracker.h" +#include #include #include #include diff --git a/src/IO/WriteBufferFromS3.h b/src/IO/WriteBufferFromS3.h index 28754d180bf..afd8b9909c1 100644 --- a/src/IO/WriteBufferFromS3.h +++ b/src/IO/WriteBufferFromS3.h @@ -12,7 +12,7 @@ #include #include #include -#include +#include #include #include From 6143986b6d79c0262f5f7dc3052ec2a3f4cfc490 Mon Sep 17 00:00:00 2001 From: Aleksei Filatov Date: Fri, 1 Mar 2024 14:55:02 +0300 Subject: [PATCH 091/985] Add query test --- ...raverse_shadow_system_data_paths.reference | 3 ++ ...03000_traverse_shadow_system_data_paths.sh | 34 +++++++++++++++++++ 
2 files changed, 37 insertions(+) create mode 100644 tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.reference create mode 100755 tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh diff --git a/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.reference b/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.reference new file mode 100644 index 00000000000..e8183f05f5d --- /dev/null +++ b/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.reference @@ -0,0 +1,3 @@ +1 +1 +1 diff --git a/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh b/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh new file mode 100755 index 00000000000..a22cb200f9a --- /dev/null +++ b/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh @@ -0,0 +1,34 @@ +#!/usr/bin/env bash +# Tags: no-fasttest + +CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# shellcheck source=../shell_config.sh +. "$CURDIR"/../shell_config.sh + +TABLE="03000_traverse_shadow_system_data_path_table" +BACKUP="03000_traverse_shadow_system_data_path_backup" + +${CLICKHOUSE_CLIENT} --query="CREATE TABLE ${TABLE} ( + id Int64, + data String +) ENGINE=MergeTree() +ORDER BY id +SETTINGS storage_policy='s3_cache';" + +${CLICKHOUSE_CLIENT} --query="INSERT INTO ${TABLE} VALUES (0, 'data');" +${CLICKHOUSE_CLIENT} --query "SELECT count() > 0 FROM system.remote_data_paths WHERE disk_name = 's3_cache'" + +${CLICKHOUSE_CLIENT} --query="ALTER TABLE ${TABLE} FREEZE WITH NAME '${BACKUP}';" +${CLICKHOUSE_CLIENT} --query="DROP TABLE ${TABLE} SYNC;" + +${CLICKHOUSE_CLIENT} --query " + SELECT count() > 0 + FROM system.remote_data_paths + WHERE disk_name = 's3_cache' AND local_path LIKE '%shadow/${BACKUP}%' + SETTINGS traverse_shadow_remote_data_paths=1;" +${CLICKHOUSE_CLIENT} --query "SYSTEM UNFREEZE WITH NAME '${BACKUP}';" >/dev/null +${CLICKHOUSE_CLIENT} --query " + SELECT count() == 0 + FROM system.remote_data_paths + WHERE disk_name = 's3_cache' AND local_path LIKE '%shadow/${BACKUP}%' + SETTINGS traverse_shadow_remote_data_paths=1;" From a7aeb4c00f106d396364bf2a21697e329d3d284d Mon Sep 17 00:00:00 2001 From: Peter Date: Fri, 1 Mar 2024 23:44:58 +0800 Subject: [PATCH 092/985] Add --now option to enable and start the service --- packages/clickhouse-server.postinstall | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/packages/clickhouse-server.postinstall b/packages/clickhouse-server.postinstall index d3b49db758f..41d4405a790 100644 --- a/packages/clickhouse-server.postinstall +++ b/packages/clickhouse-server.postinstall @@ -36,7 +36,7 @@ if [ "$1" = configure ] || [ -n "$not_deb_os" ]; then fi /bin/systemctl daemon-reload - /bin/systemctl enable clickhouse-server + /bin/systemctl enable --now clickhouse-server else # If you downgrading to version older than 1.1.54336 run: systemctl disable clickhouse-server if [ -x "/etc/init.d/clickhouse-server" ]; then From 3825cb3ad0d7f2296cf075648d022ef26f1e0cef Mon Sep 17 00:00:00 2001 From: Yakov Olkhovskiy Date: Sat, 2 Mar 2024 15:28:45 +0000 Subject: [PATCH 093/985] expand CTE in alter modify query --- src/Interpreters/InterpreterAlterQuery.cpp | 11 +++++++++++ .../0_stateless/03002_modify_query_cte.reference | 2 ++ .../0_stateless/03002_modify_query_cte.sql | 15 +++++++++++++++ 3 files changed, 28 insertions(+) create mode 100644 tests/queries/0_stateless/03002_modify_query_cte.reference create mode 100644 tests/queries/0_stateless/03002_modify_query_cte.sql diff --git 
a/src/Interpreters/InterpreterAlterQuery.cpp b/src/Interpreters/InterpreterAlterQuery.cpp index b768593da98..7acaf95becc 100644 --- a/src/Interpreters/InterpreterAlterQuery.cpp +++ b/src/Interpreters/InterpreterAlterQuery.cpp @@ -1,3 +1,4 @@ +#include #include #include @@ -71,11 +72,15 @@ BlockIO InterpreterAlterQuery::execute() BlockIO InterpreterAlterQuery::executeToTable(const ASTAlterQuery & alter) { + ASTSelectWithUnionQuery * modify_query = nullptr; + for (auto & child : alter.command_list->children) { auto * command_ast = child->as(); if (command_ast->sql_security) InterpreterCreateQuery::processSQLSecurityOption(getContext(), command_ast->sql_security->as()); + else if (command_ast->type == ASTAlterCommand::MODIFY_QUERY) + modify_query = command_ast->select->as(); } BlockIO res; @@ -123,6 +128,12 @@ BlockIO InterpreterAlterQuery::executeToTable(const ASTAlterQuery & alter) throw Exception(ErrorCodes::TABLE_IS_READ_ONLY, "Table is read-only"); auto table_lock = table->lockForShare(getContext()->getCurrentQueryId(), getContext()->getSettingsRef().lock_acquire_timeout); + if (modify_query) + { + // Expand CTE before filling default database + ApplyWithSubqueryVisitor().visit(*modify_query); + } + /// Add default database to table identifiers that we can encounter in e.g. default expressions, mutation expression, etc. AddDefaultDatabaseVisitor visitor(getContext(), table_id.getDatabaseName()); ASTPtr command_list_ptr = alter.command_list->ptr(); diff --git a/tests/queries/0_stateless/03002_modify_query_cte.reference b/tests/queries/0_stateless/03002_modify_query_cte.reference new file mode 100644 index 00000000000..a3d66f70f8f --- /dev/null +++ b/tests/queries/0_stateless/03002_modify_query_cte.reference @@ -0,0 +1,2 @@ +CREATE MATERIALIZED VIEW default.mv_03002 TO default.table_03002\n(\n `ts` DateTime\n)\nAS SELECT ts\nFROM default.table_03002 +CREATE MATERIALIZED VIEW default.mv_03002 TO default.table_03002\n(\n `ts` DateTime\n)\nAS WITH MY_CTE AS\n (\n SELECT ts\n FROM default.table_03002\n )\nSELECT *\nFROM\nMY_CTE diff --git a/tests/queries/0_stateless/03002_modify_query_cte.sql b/tests/queries/0_stateless/03002_modify_query_cte.sql new file mode 100644 index 00000000000..3a36ce7e7fd --- /dev/null +++ b/tests/queries/0_stateless/03002_modify_query_cte.sql @@ -0,0 +1,15 @@ + +CREATE TABLE table_03002 (ts DateTime, event_type String) ENGINE = MergeTree ORDER BY (event_type, ts); + +CREATE MATERIALIZED VIEW mv_03002 TO table_03002 AS SELECT ts FROM table_03002; + +SHOW CREATE TABLE mv_03002; + +ALTER TABLE mv_03002 MODIFY QUERY +WITH MY_CTE AS (SELECT ts FROM table_03002) +SELECT * FROM MY_CTE; + +SHOW CREATE TABLE mv_03002; + +DROP TABLE mv_03002; +DROP TABLE table_03002; From 17413ded759ebcef809e03a80284f6f805507560 Mon Sep 17 00:00:00 2001 From: Yakov Olkhovskiy <99031427+yakov-olkhovskiy@users.noreply.github.com> Date: Sat, 2 Mar 2024 11:11:44 -0500 Subject: [PATCH 094/985] Update 03002_modify_query_cte.reference --- tests/queries/0_stateless/03002_modify_query_cte.reference | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/03002_modify_query_cte.reference b/tests/queries/0_stateless/03002_modify_query_cte.reference index a3d66f70f8f..50e4a7c6a07 100644 --- a/tests/queries/0_stateless/03002_modify_query_cte.reference +++ b/tests/queries/0_stateless/03002_modify_query_cte.reference @@ -1,2 +1,2 @@ CREATE MATERIALIZED VIEW default.mv_03002 TO default.table_03002\n(\n `ts` DateTime\n)\nAS SELECT ts\nFROM default.table_03002 -CREATE 
MATERIALIZED VIEW default.mv_03002 TO default.table_03002\n(\n `ts` DateTime\n)\nAS WITH MY_CTE AS\n (\n SELECT ts\n FROM default.table_03002\n )\nSELECT *\nFROM\nMY_CTE +CREATE MATERIALIZED VIEW default.mv_03002 TO default.table_03002\n(\n `ts` DateTime\n)\nAS WITH MY_CTE AS\n (\n SELECT ts\n FROM default.table_03002\n )\nSELECT *\nFROM MY_CTE From a6cb302ab54082db5650263d6417052f81f30710 Mon Sep 17 00:00:00 2001 From: serxa Date: Sun, 3 Mar 2024 15:48:49 +0000 Subject: [PATCH 095/985] fix 'AddressSanitizer: stack-use-after-return' --- src/Common/Scheduler/Nodes/tests/gtest_resource_scheduler.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Common/Scheduler/Nodes/tests/gtest_resource_scheduler.cpp b/src/Common/Scheduler/Nodes/tests/gtest_resource_scheduler.cpp index e76639a4b01..f8196d15819 100644 --- a/src/Common/Scheduler/Nodes/tests/gtest_resource_scheduler.cpp +++ b/src/Common/Scheduler/Nodes/tests/gtest_resource_scheduler.cpp @@ -140,10 +140,10 @@ TEST(SchedulerRoot, Cancel) auto b = r1.addQueue("/prio/B", "2"); r1.registerResource(); + std::barrier destruct_sync(2); std::barrier sync(2); std::thread consumer1([&] { - std::barrier destruct_sync(2); MyRequest request(1,[&] { sync.arrive_and_wait(); // (A) From 77fe221665ac8610e5ae42f547771e1877793ad0 Mon Sep 17 00:00:00 2001 From: johnnymatthews <9611008+johnnymatthews@users.noreply.github.com> Date: Sun, 3 Mar 2024 14:25:25 -0700 Subject: [PATCH 096/985] Adds undocumented rand functions. Prettifies markdown. --- .../functions/random-functions.md | 277 +++++++++++++----- 1 file changed, 206 insertions(+), 71 deletions(-) diff --git a/docs/en/sql-reference/functions/random-functions.md b/docs/en/sql-reference/functions/random-functions.md index 6fd31e8d25c..2ce9c75eae4 100644 --- a/docs/en/sql-reference/functions/random-functions.md +++ b/docs/en/sql-reference/functions/random-functions.md @@ -11,79 +11,213 @@ elimination](../../sql-reference/functions/index.md#common-subexpression-elimina function return different random values. Related content + - Blog: [Generating random data in ClickHouse](https://clickhouse.com/blog/generating-random-test-distribution-data-for-clickhouse) :::note The random numbers are generated by non-cryptographic algorithms. ::: -## rand, rand32 +## rand -Returns a random UInt32 number, evenly distributed across the range of all possible UInt32 numbers. +Returns a random UInt32 number. + +### Syntax + +```sql +rand() +``` + +### Parameters + +None. + +### Output + +Returns a number of type UInt32. + +### Example + +```sql +SELECT rand() +``` + +```response +1569354847 +``` + +### Implementation details Uses a linear congruential generator. +## rand32 + +Returns a random 32-bit unsigned integer (UInt32) number. + +### Syntax + +```sql +rand32() +``` + +### Parameters + +None. + +### Output + +Returns a number of type UInt32, evenly distributed across the range of all possible UInt32 values. + +### Example + +```sql +SELECT rand32(); +``` + +```response +2754546224 +``` + +**Note:** The actual output will be a random number, not the specific number shown in the example. + ## rand64 -Returns a random UInt64 number, evenly distributed across the range of all possible UInt64 numbers. +Returns a random 64-bit unsigned integer (UInt64) number. -Uses a linear congruential generator. +### Syntax + +```sql +rand64() +``` + +### Parameters + +None. 
+ +### Implementation details + +The `rand64` function uses a linear congruential generator, which means that while it appears random, it's not truly random and can be predictable if the initial state is known. + +For scenarios where true randomness is crucial, consider using alternative methods like system-level calls or integrating with external libraries. + +### Output + +Returns a number of type UInt64, evenly distributed across the range of all possible UInt64 values. + +### Example + +```sql +SELECT rand64(); +``` + +```response +15030268859237645412 +``` + +**Note:** The actual output will be a random number, not the specific number shown in the example. ## randCanonical -Returns a random Float64 value, evenly distributed in interval [0, 1). +Returns a random floating-point number of type Float64, evenly distributed within the closed interval. + +### Syntax + +```sql +randCanonical() +``` + +### Parameters + +None. + +### Output + +Returns a Float64 value between 0 (inclusive) and 1 (exclusive). + +### Example + +```sql +SELECT randCanonical(); +``` + +```response +0.3452178901234567 +``` + +**Note:** The actual output will be a random decimal number between 0 and 1, not the specific number shown in the example. ## randConstant -Like `rand` but produces a constant column with a random value. +Generates a single constant column filled with a random value. Unlike `rand`, `randConstant` ensures the same random value appears in every row of the generated column, making it useful for scenarios requiring a consistent random seed across rows in a single query. -**Example** +### Syntax -``` sql -SELECT rand(), rand(1), rand(number), randConstant(), randConstant(1), randConstant(number) -FROM numbers(3) +```sql +randConstant([x]); ``` -Result: +### Parameters -``` result -┌─────rand()─┬────rand(1)─┬─rand(number)─┬─randConstant()─┬─randConstant(1)─┬─randConstant(number)─┐ -│ 3047369878 │ 4132449925 │ 4044508545 │ 2740811946 │ 4229401477 │ 1924032898 │ -│ 2938880146 │ 1267722397 │ 4154983056 │ 2740811946 │ 4229401477 │ 1924032898 │ -│ 956619638 │ 4238287282 │ 1104342490 │ 2740811946 │ 4229401477 │ 1924032898 │ -└────────────┴────────────┴──────────────┴────────────────┴─────────────────┴──────────────────────┘ +- **[x] (Optional):** An optional expression that influences the generated random value. Even if provided, the resulting value will still be constant within the same query execution. Different queries using the same expression will likely generate different constant values. + +### Implementation details + +The actual output will be different for each query execution, even with the same optional expression. + +The optional parameter may not significantly change the generated value compared to using `randConstant` alone. + +### Output + +Returns a column of type UInt32 containing the same random value in each row. + +### Examples + +```sql +SELECT randConstant() AS random_value; +``` + +```response +| random_value | +|--------------| +| 1234567890 | +``` + +```sql +SELECT randConstant(10) AS random_value; +``` + +```response +| random_value | +|--------------| +| 9876543210 | ``` ## randUniform -Returns a random Float64 drawn uniformly from interval [`min`, `max`) ([continuous uniform distribution](https://en.wikipedia.org/wiki/Continuous_uniform_distribution)). +Returns a random Float64 drawn uniformly from interval [`min`, `max`]. 
-**Syntax** +### Syntax -``` sql +```sql randUniform(min, max) ``` -**Arguments** +### Parameters - `min` - `Float64` - left boundary of the range, - `max` - `Float64` - right boundary of the range. -**Returned value** +### Output -- Random number. +A random number of type [Float64](/docs/en/sql-reference/data-types/float.md). -Type: [Float64](/docs/en/sql-reference/data-types/float.md). +### Example -**Example** - -``` sql +```sql SELECT randUniform(5.5, 10) FROM numbers(5) ``` -Result: - -``` result +```response ┌─randUniform(5.5, 10)─┐ │ 8.094978491443102 │ │ 7.3181248914450885 │ @@ -99,7 +233,7 @@ Returns a random Float64 drawn from a [normal distribution](https://en.wikipedia **Syntax** -``` sql +```sql randNormal(mean, variance) ``` @@ -116,13 +250,13 @@ Type: [Float64](/docs/en/sql-reference/data-types/float.md). **Example** -``` sql +```sql SELECT randNormal(10, 2) FROM numbers(5) ``` Result: -``` result +```result ┌──randNormal(10, 2)─┐ │ 13.389228911709653 │ │ 8.622949707401295 │ @@ -138,7 +272,7 @@ Returns a random Float64 drawn from a [log-normal distribution](https://en.wikip **Syntax** -``` sql +```sql randLogNormal(mean, variance) ``` @@ -155,13 +289,13 @@ Type: [Float64](/docs/en/sql-reference/data-types/float.md). **Example** -``` sql +```sql SELECT randLogNormal(100, 5) FROM numbers(5) ``` Result: -``` result +```result ┌─randLogNormal(100, 5)─┐ │ 1.295699673937363e48 │ │ 9.719869109186684e39 │ @@ -177,7 +311,7 @@ Returns a random UInt64 drawn from a [binomial distribution](https://en.wikipedi **Syntax** -``` sql +```sql randBinomial(experiments, probability) ``` @@ -194,13 +328,13 @@ Type: [UInt64](/docs/en/sql-reference/data-types/int-uint.md). **Example** -``` sql +```sql SELECT randBinomial(100, .75) FROM numbers(5) ``` Result: -``` result +```result ┌─randBinomial(100, 0.75)─┐ │ 74 │ │ 78 │ @@ -216,7 +350,7 @@ Returns a random UInt64 drawn from a [negative binomial distribution](https://en **Syntax** -``` sql +```sql randNegativeBinomial(experiments, probability) ``` @@ -233,13 +367,13 @@ Type: [UInt64](/docs/en/sql-reference/data-types/int-uint.md). **Example** -``` sql +```sql SELECT randNegativeBinomial(100, .75) FROM numbers(5) ``` Result: -``` result +```result ┌─randNegativeBinomial(100, 0.75)─┐ │ 33 │ │ 32 │ @@ -255,7 +389,7 @@ Returns a random UInt64 drawn from a [Poisson distribution](https://en.wikipedia **Syntax** -``` sql +```sql randPoisson(n) ``` @@ -271,13 +405,13 @@ Type: [UInt64](/docs/en/sql-reference/data-types/int-uint.md). **Example** -``` sql +```sql SELECT randPoisson(10) FROM numbers(5) ``` Result: -``` result +```result ┌─randPoisson(10)─┐ │ 8 │ │ 8 │ @@ -293,7 +427,7 @@ Returns a random UInt64 drawn from a [Bernoulli distribution](https://en.wikiped **Syntax** -``` sql +```sql randBernoulli(probability) ``` @@ -309,13 +443,13 @@ Type: [UInt64](/docs/en/sql-reference/data-types/int-uint.md). **Example** -``` sql +```sql SELECT randBernoulli(.75) FROM numbers(5) ``` Result: -``` result +```result ┌─randBernoulli(0.75)─┐ │ 1 │ │ 1 │ @@ -331,7 +465,7 @@ Returns a random Float64 drawn from a [exponential distribution](https://en.wiki **Syntax** -``` sql +```sql randExponential(lambda) ``` @@ -347,13 +481,13 @@ Type: [Float64](/docs/en/sql-reference/data-types/float.md). 
**Example** -``` sql +```sql SELECT randExponential(1/10) FROM numbers(5) ``` Result: -``` result +```result ┌─randExponential(divide(1, 10))─┐ │ 44.71628934340778 │ │ 4.211013337903262 │ @@ -369,7 +503,7 @@ Returns a random Float64 drawn from a [Chi-square distribution](https://en.wikip **Syntax** -``` sql +```sql randChiSquared(degree_of_freedom) ``` @@ -385,13 +519,13 @@ Type: [Float64](/docs/en/sql-reference/data-types/float.md). **Example** -``` sql +```sql SELECT randChiSquared(10) FROM numbers(5) ``` Result: -``` result +```result ┌─randChiSquared(10)─┐ │ 10.015463656521543 │ │ 9.621799919882768 │ @@ -407,7 +541,7 @@ Returns a random Float64 drawn from a [Student's t-distribution](https://en.wiki **Syntax** -``` sql +```sql randStudentT(degree_of_freedom) ``` @@ -423,13 +557,13 @@ Type: [Float64](/docs/en/sql-reference/data-types/float.md). **Example** -``` sql +```sql SELECT randStudentT(10) FROM numbers(5) ``` Result: -``` result +```result ┌─────randStudentT(10)─┐ │ 1.2217309938538725 │ │ 1.7941971681200541 │ @@ -445,7 +579,7 @@ Returns a random Float64 drawn from a [F-distribution](https://en.wikipedia.org/ **Syntax** -``` sql +```sql randFisherF(d1, d2) ``` @@ -462,13 +596,13 @@ Type: [Float64](/docs/en/sql-reference/data-types/float.md). **Example** -``` sql +```sql SELECT randFisherF(10, 3) FROM numbers(5) ``` Result: -``` result +```result ┌──randFisherF(10, 3)─┐ │ 7.286287504216609 │ │ 0.26590779413050386 │ @@ -484,7 +618,7 @@ Generates a string of the specified length filled with random bytes (including z **Syntax** -``` sql +```sql randomString(length) ``` @@ -502,13 +636,13 @@ Type: [String](../../sql-reference/data-types/string.md). Query: -``` sql +```sql SELECT randomString(30) AS str, length(str) AS len FROM numbers(2) FORMAT Vertical; ``` Result: -``` text +```text Row 1: ────── str: 3 G : pT ?w тi k aV f6 @@ -526,7 +660,7 @@ Generates a binary string of the specified length filled with random bytes (incl **Syntax** -``` sql +```sql randomFixedString(length); ``` @@ -563,7 +697,7 @@ If you pass `length < 0`, the behavior of the function is undefined. **Syntax** -``` sql +```sql randomPrintableASCII(length) ``` @@ -579,11 +713,11 @@ Type: [String](../../sql-reference/data-types/string.md) **Example** -``` sql +```sql SELECT number, randomPrintableASCII(30) as str, length(str) FROM system.numbers LIMIT 3 ``` -``` text +```text ┌─number─┬─str────────────────────────────┬─length(randomPrintableASCII(30))─┐ │ 0 │ SuiCOSTvC0csfABSw=UcSzp2.`rv8x │ 30 │ │ 1 │ 1Ag NlJ &RCN:*>HVPG;PE-nO"SUFD │ 30 │ @@ -597,7 +731,7 @@ Generates a random string of a specified length. Result string contains valid UT **Syntax** -``` sql +```sql randomStringUTF8(length); ``` @@ -635,11 +769,12 @@ Flips the bits of String or FixedString `s`, each with probability `prob`. **Syntax** -``` sql +```sql fuzzBits(s, prob) ``` **Arguments** + - `s` - `String` or `FixedString`, - `prob` - constant `Float32/64` between 0.0 and 1.0. @@ -649,14 +784,14 @@ Fuzzed string with same type as `s`. **Example** -``` sql +```sql SELECT fuzzBits(materialize('abacaba'), 0.1) FROM numbers(3) ``` Result: -``` result +```result ┌─fuzzBits(materialize('abacaba'), 0.1)─┐ │ abaaaja │ │ a*cjab+ │ From e98c30c161303d91c483e7928326f0d8efc1f9df Mon Sep 17 00:00:00 2001 From: johnnymatthews <9611008+johnnymatthews@users.noreply.github.com> Date: Sun, 3 Mar 2024 14:38:59 -0700 Subject: [PATCH 097/985] Reorganizes rand docs page. 
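The page reorganized here documents, among other things, the contrast between per-row and per-query randomness (`rand` versus `randConstant`). A short illustrative query makes that contrast concrete; the actual numbers differ on every run, so only the shape of the result matters.

```sql
-- rand() is evaluated once per row, randConstant() once per query block.
SELECT
    number,
    rand()         AS per_row_value,
    randConstant() AS per_query_value
FROM numbers(3);

-- Expected shape: per_row_value differs across the three rows,
-- while per_query_value repeats the same UInt32 in all of them.
```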
--- .../functions/random-functions.md | 30 +++++++++---------- 1 file changed, 14 insertions(+), 16 deletions(-) diff --git a/docs/en/sql-reference/functions/random-functions.md b/docs/en/sql-reference/functions/random-functions.md index 2ce9c75eae4..b745d2833d3 100644 --- a/docs/en/sql-reference/functions/random-functions.md +++ b/docs/en/sql-reference/functions/random-functions.md @@ -36,19 +36,21 @@ None. Returns a number of type UInt32. +### Implementation details + +Uses a linear congruential generator. + ### Example ```sql -SELECT rand() +SELECT rand(); ``` ```response 1569354847 ``` -### Implementation details - -Uses a linear congruential generator. +**Note:** The actual output will be a random number, not the specific number shown in the example. ## rand32 @@ -94,16 +96,14 @@ rand64() None. -### Implementation details - -The `rand64` function uses a linear congruential generator, which means that while it appears random, it's not truly random and can be predictable if the initial state is known. - -For scenarios where true randomness is crucial, consider using alternative methods like system-level calls or integrating with external libraries. - ### Output Returns a number of type UInt64, evenly distributed across the range of all possible UInt64 values. +### Implementation details + +The `rand64` function uses a linear congruential generator, which means that while it appears random, it's not truly random and can be predictable if the initial state is known. For scenarios where true randomness is crucial, consider using alternative methods like system-level calls or integrating with external libraries. + ### Example ```sql @@ -160,16 +160,14 @@ randConstant([x]); - **[x] (Optional):** An optional expression that influences the generated random value. Even if provided, the resulting value will still be constant within the same query execution. Different queries using the same expression will likely generate different constant values. -### Implementation details - -The actual output will be different for each query execution, even with the same optional expression. - -The optional parameter may not significantly change the generated value compared to using `randConstant` alone. - ### Output Returns a column of type UInt32 containing the same random value in each row. +### Implementation details + +The actual output will be different for each query execution, even with the same optional expression. The optional parameter may not significantly change the generated value compared to using `randConstant` alone. 
+ ### Examples ```sql From 671b0f678afcdcb354a85aa141920bff09e2bcb2 Mon Sep 17 00:00:00 2001 From: M1eyu2018 <857037797@qq.com> Date: Mon, 4 Mar 2024 10:12:27 +0800 Subject: [PATCH 098/985] Add positional read in libhdfs3 Signed-off-by: M1eyu2018 <857037797@qq.com> --- contrib/libhdfs3 | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/contrib/libhdfs3 b/contrib/libhdfs3 index b9598e60167..0d04201c453 160000 --- a/contrib/libhdfs3 +++ b/contrib/libhdfs3 @@ -1 +1 @@ -Subproject commit b9598e6016720a7c088bfe85ce1fa0410f9d2103 +Subproject commit 0d04201c45359f0d0701fb1e8297d25eff7cfecf From c435d5894f48d37478454b1934d000fb967e2973 Mon Sep 17 00:00:00 2001 From: taiyang-li <654010905@qq.com> Date: Mon, 4 Mar 2024 14:23:59 +0800 Subject: [PATCH 099/985] remove wrong assertion n quantileGK --- .../AggregateFunctionGroupArray.cpp | 13 ++++++++----- .../AggregateFunctionQuantileGK.cpp | 12 ++++-------- 2 files changed, 12 insertions(+), 13 deletions(-) diff --git a/src/AggregateFunctions/AggregateFunctionGroupArray.cpp b/src/AggregateFunctions/AggregateFunctionGroupArray.cpp index d72ddb42d9e..6af8b1018dd 100644 --- a/src/AggregateFunctions/AggregateFunctionGroupArray.cpp +++ b/src/AggregateFunctions/AggregateFunctionGroupArray.cpp @@ -182,11 +182,14 @@ public: if constexpr (Trait::sampler == Sampler::NONE) { - if (limit_num_elems && cur_elems.value.size() >= max_elems) + if constexpr (limit_num_elems) { - if constexpr (Trait::last) - cur_elems.value[(cur_elems.total_values - 1) % max_elems] = row_value; - return; + if (cur_elems.value.size() >= max_elems) + { + if constexpr (Trait::last) + cur_elems.value[(cur_elems.total_values - 1) % max_elems] = row_value; + return; + } } cur_elems.value.push_back(row_value, arena); @@ -236,7 +239,7 @@ public: void mergeNoSampler(Data & cur_elems, const Data & rhs_elems, Arena * arena) const { - if (!limit_num_elems) + if constexpr (!limit_num_elems) { if (rhs_elems.value.size()) cur_elems.value.insertByOffsets(rhs_elems.value, 0, rhs_elems.value.size(), arena); diff --git a/src/AggregateFunctions/AggregateFunctionQuantileGK.cpp b/src/AggregateFunctions/AggregateFunctionQuantileGK.cpp index 2e8ccb2e5e4..26737e43eef 100644 --- a/src/AggregateFunctions/AggregateFunctionQuantileGK.cpp +++ b/src/AggregateFunctions/AggregateFunctionQuantileGK.cpp @@ -144,7 +144,7 @@ public: count = other.count; compressed = other.compressed; - sampled.resize(other.sampled.size()); + sampled.resize_exact(other.sampled.size()); memcpy(sampled.data(), other.sampled.data(), sizeof(Stats) * other.sampled.size()); return; } @@ -180,7 +180,7 @@ public: compress(); backup_sampled.clear(); - backup_sampled.reserve(sampled.size() + other.sampled.size()); + backup_sampled.reserve_exact(sampled.size() + other.sampled.size()); double merged_relative_error = std::max(relative_error, other.relative_error); size_t merged_count = count + other.count; Int64 additional_self_delta = static_cast(std::floor(2 * other.relative_error * other.count)); @@ -268,11 +268,7 @@ public: size_t sampled_len = 0; readBinaryLittleEndian(sampled_len, buf); - if (sampled_len > compress_threshold) - throw Exception( - ErrorCodes::INCORRECT_DATA, "The number of elements {} for quantileGK exceeds {}", sampled_len, compress_threshold); - - sampled.resize(sampled_len); + sampled.resize_exact(sampled_len); for (size_t i = 0; i < sampled_len; ++i) { @@ -317,7 +313,7 @@ private: ::sort(head_sampled.begin(), head_sampled.end()); backup_sampled.clear(); - backup_sampled.reserve(sampled.size() + 
head_sampled.size()); + backup_sampled.reserve_exact(sampled.size() + head_sampled.size()); size_t sample_idx = 0; size_t ops_idx = 0; From 6fbfd42a0522fe4161d367e3d923f2480c1df21a Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Mon, 4 Mar 2024 16:13:44 +0800 Subject: [PATCH 100/985] Update 02241_filesystem_cache_on_write_operations.reference --- .../02241_filesystem_cache_on_write_operations.reference | 6 ------ 1 file changed, 6 deletions(-) diff --git a/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.reference b/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.reference index 53566a18edc..186dcc1eeb2 100644 --- a/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.reference +++ b/tests/queries/0_stateless/02241_filesystem_cache_on_write_operations.reference @@ -205,13 +205,7 @@ INSERT INTO test_02241 SELECT number, toString(number) FROM numbers(300, 10000) SELECT count(), sum(size) FROM system.filesystem_cache 24 84045 SYSTEM START MERGES test_02241 -SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes' -81715476 -SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes' OPTIMIZE TABLE test_02241 FINAL -SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes' -81881872 -SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes' SELECT count(), sum(size) FROM system.filesystem_cache 32 167243 ALTER TABLE test_02241 UPDATE value = 'kek' WHERE key = 100 From 1768b4477f4ff5db238cd4cc553587b136ed015d Mon Sep 17 00:00:00 2001 From: Azat Khuzhin Date: Sun, 3 Mar 2024 11:50:22 +0100 Subject: [PATCH 101/985] Revert "Merge pull request #60690 from ClickHouse/remove-bad-test-8" This reverts commit c77eb8b1427f98daf63f7087bbdc0530b07db825, reversing changes made to bae4783fe9bd25decc41383a1234b0e936284c21. 
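The test restored by this revert verifies that the temporary table created for HTTP external data is actually destroyed, by looking for memory-profiler samples of the drop path in `system.trace_log`. Stripped of the shell quoting used in the script below, the introspection pattern it relies on looks roughly like this; the `query_id` value is a placeholder.

```sql
-- Rough sketch of the trace_log check performed by the restored test.
WITH arrayStringConcat(arrayMap(x -> demangle(addressToSymbol(x)), trace), '\n') AS sym
SELECT count() > 0
FROM system.trace_log
WHERE query_id = '<query id of the external-table query>'
  AND trace_type = 'MemorySample'
  AND size < 0                      -- deallocations only
  AND sym LIKE '%StorageMemory::drop%'
SETTINGS allow_introspection_functions = 1;
```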
--- ..._external_tables_memory_tracking.reference | 16 ++++++ ...52_http_external_tables_memory_tracking.sh | 51 +++++++++++++++++++ 2 files changed, 67 insertions(+) create mode 100644 tests/queries/0_stateless/02152_http_external_tables_memory_tracking.reference create mode 100755 tests/queries/0_stateless/02152_http_external_tables_memory_tracking.sh diff --git a/tests/queries/0_stateless/02152_http_external_tables_memory_tracking.reference b/tests/queries/0_stateless/02152_http_external_tables_memory_tracking.reference new file mode 100644 index 00000000000..1fc09c8d154 --- /dev/null +++ b/tests/queries/0_stateless/02152_http_external_tables_memory_tracking.reference @@ -0,0 +1,16 @@ +Checking input_format_parallel_parsing=false& +1 +Checking input_format_parallel_parsing=false&cancel_http_readonly_queries_on_client_close=1&readonly=1 +1 +Checking input_format_parallel_parsing=false&send_progress_in_http_headers=true +1 +Checking input_format_parallel_parsing=false&cancel_http_readonly_queries_on_client_close=1&readonly=1&send_progress_in_http_headers=true +1 +Checking input_format_parallel_parsing=true& +1 +Checking input_format_parallel_parsing=true&cancel_http_readonly_queries_on_client_close=1&readonly=1 +1 +Checking input_format_parallel_parsing=true&send_progress_in_http_headers=true +1 +Checking input_format_parallel_parsing=true&cancel_http_readonly_queries_on_client_close=1&readonly=1&send_progress_in_http_headers=true +1 diff --git a/tests/queries/0_stateless/02152_http_external_tables_memory_tracking.sh b/tests/queries/0_stateless/02152_http_external_tables_memory_tracking.sh new file mode 100755 index 00000000000..5f9eb460e44 --- /dev/null +++ b/tests/queries/0_stateless/02152_http_external_tables_memory_tracking.sh @@ -0,0 +1,51 @@ +#!/usr/bin/env bash +# Tags: no-tsan, no-cpu-aarch64, no-parallel +# TSan does not supports tracing. +# trace_log doesn't work on aarch64 + +# Regression for proper release of Context, +# via tracking memory of external tables. + +CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# shellcheck source=../shell_config.sh +. "$CURDIR"/../shell_config.sh + +tmp_file=$(mktemp "$CURDIR/clickhouse.XXXXXX.csv") +trap 'rm $tmp_file' EXIT + +$CLICKHOUSE_CLIENT -q "SELECT toString(number) FROM numbers(1e6) FORMAT TSV" > "$tmp_file" + +function run_and_check() +{ + local query_id + query_id="$(${CLICKHOUSE_CURL} -sS "${CLICKHOUSE_URL}" --data-binary @- <<<'SELECT generateUUIDv4()')" + + echo "Checking $*" + + # Run query with external table (implicit StorageMemory user) + $CLICKHOUSE_CURL -sS -F "s=@$tmp_file;" "$CLICKHOUSE_URL&s_structure=key+Int&query=SELECT+count()+FROM+s&memory_profiler_sample_probability=1&max_untracked_memory=0&query_id=$query_id&$*" -o /dev/null + + ${CLICKHOUSE_CURL} -sS "${CLICKHOUSE_URL}" --data-binary @- <<<'SYSTEM FLUSH LOGS' + + # Check that temporary table had been destroyed. 
+ ${CLICKHOUSE_CURL} -sS "${CLICKHOUSE_URL}&allow_introspection_functions=1" --data-binary @- <<<" + WITH arrayStringConcat(arrayMap(x -> demangle(addressToSymbol(x)), trace), '\n') AS sym + SELECT count()>0 FROM system.trace_log + WHERE + sym LIKE '%DB::StorageMemory::drop%\n%TemporaryTableHolder::~TemporaryTableHolder%' AND + query_id = '$query_id' + " +} + +for input_format_parallel_parsing in false true; do + query_args_variants=( + "" + "cancel_http_readonly_queries_on_client_close=1&readonly=1" + "send_progress_in_http_headers=true" + # nested progress callback + "cancel_http_readonly_queries_on_client_close=1&readonly=1&send_progress_in_http_headers=true" + ) + for query_args in "${query_args_variants[@]}"; do + run_and_check "input_format_parallel_parsing=$input_format_parallel_parsing&$query_args" + done +done From 048a042dc4963631a23358d3e454dcd8a9eaafa2 Mon Sep 17 00:00:00 2001 From: Azat Khuzhin Date: Sun, 3 Mar 2024 11:50:46 +0100 Subject: [PATCH 102/985] Make 02152_http_external_tables_memory_tracking less flaky Signed-off-by: Azat Khuzhin --- .../02152_http_external_tables_memory_tracking.sh | 14 ++++++++++---- 1 file changed, 10 insertions(+), 4 deletions(-) diff --git a/tests/queries/0_stateless/02152_http_external_tables_memory_tracking.sh b/tests/queries/0_stateless/02152_http_external_tables_memory_tracking.sh index 5f9eb460e44..5494f7d59cb 100755 --- a/tests/queries/0_stateless/02152_http_external_tables_memory_tracking.sh +++ b/tests/queries/0_stateless/02152_http_external_tables_memory_tracking.sh @@ -1,5 +1,5 @@ #!/usr/bin/env bash -# Tags: no-tsan, no-cpu-aarch64, no-parallel +# Tags: no-tsan, no-cpu-aarch64, no-parallel, no-debug # TSan does not supports tracing. # trace_log doesn't work on aarch64 @@ -30,10 +30,16 @@ function run_and_check() # Check that temporary table had been destroyed. 
${CLICKHOUSE_CURL} -sS "${CLICKHOUSE_URL}&allow_introspection_functions=1" --data-binary @- <<<" WITH arrayStringConcat(arrayMap(x -> demangle(addressToSymbol(x)), trace), '\n') AS sym - SELECT count()>0 FROM system.trace_log + SELECT 1 FROM system.trace_log + PREWHERE + query_id = '$query_id' AND + trace_type = 'MemorySample' AND + /* only deallocations */ + size < 0 AND + event_date >= yesterday() WHERE - sym LIKE '%DB::StorageMemory::drop%\n%TemporaryTableHolder::~TemporaryTableHolder%' AND - query_id = '$query_id' + sym LIKE '%DB::StorageMemory::drop%\n%TemporaryTableHolder::~TemporaryTableHolder%' + LIMIT 1 " } From a7db6688edb50f894457c414b207c25548bb18d3 Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Mon, 4 Mar 2024 18:24:24 +0800 Subject: [PATCH 103/985] Update ObjectStorageFactory.cpp --- src/Disks/ObjectStorages/ObjectStorageFactory.cpp | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/src/Disks/ObjectStorages/ObjectStorageFactory.cpp b/src/Disks/ObjectStorages/ObjectStorageFactory.cpp index 47c02f87b23..a0578ac4454 100644 --- a/src/Disks/ObjectStorages/ObjectStorageFactory.cpp +++ b/src/Disks/ObjectStorages/ObjectStorageFactory.cpp @@ -246,12 +246,11 @@ void registerAzureObjectStorage(ObjectStorageFactory & factory) bool /* skip_access_check */) -> ObjectStoragePtr { AzureBlobStorageEndpoint endpoint = processAzureBlobStorageEndpoint(config, config_prefix); - return std::make_unique( + return createObjectStorage( ObjectStorageType::Azure, config, config_prefix, name, getAzureBlobContainerClient(config, config_prefix), getAzureBlobStorageSettings(config, config_prefix, context), endpoint.prefix.empty() ? endpoint.container_name : endpoint.container_name + "/" + endpoint.prefix); - }); } #endif From 81185815a48b36d344bda623dd175c30e9b87ba3 Mon Sep 17 00:00:00 2001 From: Aleksei Filatov Date: Mon, 4 Mar 2024 14:09:31 +0300 Subject: [PATCH 104/985] Update settings_changes_history --- src/Core/SettingsChangesHistory.h | 3 +++ 1 file changed, 3 insertions(+) diff --git a/src/Core/SettingsChangesHistory.h b/src/Core/SettingsChangesHistory.h index 4805df46d9b..b8793f437d8 100644 --- a/src/Core/SettingsChangesHistory.h +++ b/src/Core/SettingsChangesHistory.h @@ -85,6 +85,9 @@ namespace SettingsChangesHistory /// It's used to implement `compatibility` setting (see https://github.com/ClickHouse/ClickHouse/issues/35972) static std::map settings_changes_history = { + {"24.3", { + {"traverse_shadow_remote_data_paths", false, false, "Traverse shadow directory when query system.remote_data_paths."}, + }}, {"24.2", { {"output_format_values_escape_quote_with_quote", false, false, "If true escape ' with '', otherwise quoted with \\'"}, {"input_format_try_infer_exponent_floats", true, false, "Don't infer floats in exponential notation by default"}, From fbdc5e305365e9d93b86ed47144ffb13c1ce70c1 Mon Sep 17 00:00:00 2001 From: Aleksei Filatov Date: Mon, 4 Mar 2024 17:16:51 +0300 Subject: [PATCH 105/985] Ignore flaky fail of system unfreeze --- .../0_stateless/03000_traverse_shadow_system_data_paths.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh b/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh index a22cb200f9a..2905d7801ca 100755 --- a/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh +++ b/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh @@ -26,7 +26,7 @@ ${CLICKHOUSE_CLIENT} 
--query " FROM system.remote_data_paths WHERE disk_name = 's3_cache' AND local_path LIKE '%shadow/${BACKUP}%' SETTINGS traverse_shadow_remote_data_paths=1;" -${CLICKHOUSE_CLIENT} --query "SYSTEM UNFREEZE WITH NAME '${BACKUP}';" >/dev/null +${CLICKHOUSE_CLIENT} --query "SYSTEM UNFREEZE WITH NAME '${BACKUP}';" &>/dev/null || true ${CLICKHOUSE_CLIENT} --query " SELECT count() == 0 FROM system.remote_data_paths From aa43885ac81924a73e9a151a550e7c1af43d23e2 Mon Sep 17 00:00:00 2001 From: unashi Date: Tue, 5 Mar 2024 10:57:25 +0800 Subject: [PATCH 106/985] [improve] add check the remaining disk size before copying --- src/Storages/MergeTree/MergeTreeData.cpp | 11 +++++++++-- 1 file changed, 9 insertions(+), 2 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index 849ceb1b66d..d8680958c21 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -7160,14 +7160,18 @@ std::pair MergeTreeData::cloneAn { try { + auto reservation_space = src_part_storage->reserve(src_part->getBytesOnDisk()); + if (!reservation_space) { + throw Exception(ErrorCodes::NOT_ENOUGH_SPACE, "Not enough space on disk."); + } dst_part_storage = src_part_storage->clonePart(this->getRelativeDataPath(), tmp_dst_part_name, disk, read_settings, write_settings, {}, {}); copy_successful = true; break; } - catch (...) + catch (Exception & e) { - LOG_TRACE(&Poco::Logger::get("MergeTreeData"), "Clone part on disk {} fail", disk->getName()); + LOG_TRACE(&Poco::Logger::get("MergeTreeData"), "Clone part on disk {} fail: {}", disk->getName(), e.what()); } } if (!copy_successful) @@ -7291,6 +7295,9 @@ std::pair MergeTreeData::cloneAn { try { + auto reservation_space = src_part_storage->reserve(src_part->getBytesOnDisk()); + if (!reservation_space) + throw Exception(ErrorCodes::NOT_ENOUGH_SPACE, "Not enough space on disk."); dst_part_storage = src_part_storage->clonePart(this->getRelativeDataPath(), tmp_dst_part_name, disk, read_settings, write_settings, {}, {}); copy_successful = true; From b0050566e22d10ca621a33c1b4fedb987ad2620c Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Tue, 5 Mar 2024 12:14:56 +0800 Subject: [PATCH 107/985] Fix style check --- src/Disks/IO/ReadBufferFromRemoteFSGather.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Disks/IO/ReadBufferFromRemoteFSGather.cpp b/src/Disks/IO/ReadBufferFromRemoteFSGather.cpp index fe8d63b053d..298000ac015 100644 --- a/src/Disks/IO/ReadBufferFromRemoteFSGather.cpp +++ b/src/Disks/IO/ReadBufferFromRemoteFSGather.cpp @@ -21,7 +21,7 @@ namespace { return settings.remote_fs_cache && settings.enable_filesystem_cache; } - + bool withPageCache(const ReadSettings & settings, bool with_file_cache) { return settings.page_cache && !with_file_cache && settings.use_page_cache_for_disks_without_file_cache; From 2ee846b393d79f3f0d9710ddf910552ba1e040cd Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Tue, 5 Mar 2024 14:07:56 +0800 Subject: [PATCH 108/985] Fix build --- src/Disks/IO/ReadBufferFromRemoteFSGather.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Disks/IO/ReadBufferFromRemoteFSGather.cpp b/src/Disks/IO/ReadBufferFromRemoteFSGather.cpp index 298000ac015..f72e6634465 100644 --- a/src/Disks/IO/ReadBufferFromRemoteFSGather.cpp +++ b/src/Disks/IO/ReadBufferFromRemoteFSGather.cpp @@ -17,7 +17,7 @@ using namespace DB; namespace { - bool 
withCache(const ReadSettings & settings) + bool withFileCache(const ReadSettings & settings) { return settings.remote_fs_cache && settings.enable_filesystem_cache; } From 758a75c1b46fa27a88e3dcf6e70a18dcf41d62ef Mon Sep 17 00:00:00 2001 From: Aleksei Filatov Date: Tue, 5 Mar 2024 09:53:30 +0300 Subject: [PATCH 109/985] Fix flaky test. Fix clang-tidy warning --- src/Disks/IDisk.h | 7 +++---- src/Disks/ObjectStorages/DiskObjectStorage.h | 2 +- src/Storages/System/StorageSystemRemoteDataPaths.cpp | 4 ++-- .../0_stateless/03000_traverse_shadow_system_data_paths.sh | 7 +------ 4 files changed, 7 insertions(+), 13 deletions(-) diff --git a/src/Disks/IDisk.h b/src/Disks/IDisk.h index 62b02938d1a..fcc92db7b96 100644 --- a/src/Disks/IDisk.h +++ b/src/Disks/IDisk.h @@ -321,11 +321,10 @@ public: }; virtual void getRemotePathsRecursive( - const String &, - std::vector &, - const std::function & /* skip_predicate */ = {}) + const String &, std::vector &, const std::function & /* skip_predicate */) { - throw Exception(ErrorCodes::NOT_IMPLEMENTED, + throw Exception( + ErrorCodes::NOT_IMPLEMENTED, "Method `getRemotePathsRecursive() not implemented for disk: {}`", getDataSourceDescription().toString()); } diff --git a/src/Disks/ObjectStorages/DiskObjectStorage.h b/src/Disks/ObjectStorages/DiskObjectStorage.h index d7af656bea3..9f11c0ed02e 100644 --- a/src/Disks/ObjectStorages/DiskObjectStorage.h +++ b/src/Disks/ObjectStorages/DiskObjectStorage.h @@ -51,7 +51,7 @@ public: void getRemotePathsRecursive( const String & local_path, std::vector & paths_map, - const std::function & skip_predicate = {}) override; + const std::function & skip_predicate) override; const std::string & getCacheName() const override { return object_storage->getCacheName(); } diff --git a/src/Storages/System/StorageSystemRemoteDataPaths.cpp b/src/Storages/System/StorageSystemRemoteDataPaths.cpp index 708c1369965..a6263f18492 100644 --- a/src/Storages/System/StorageSystemRemoteDataPaths.cpp +++ b/src/Storages/System/StorageSystemRemoteDataPaths.cpp @@ -58,8 +58,8 @@ Pipe StorageSystemRemoteDataPaths::read( if (disk->isRemote()) { std::vector remote_paths_by_local_path; - disk->getRemotePathsRecursive("store", remote_paths_by_local_path); - disk->getRemotePathsRecursive("data", remote_paths_by_local_path); + disk->getRemotePathsRecursive("store", remote_paths_by_local_path, /* skip_predicate = */ {}); + disk->getRemotePathsRecursive("data", remote_paths_by_local_path, /* skip_predicate = */ {}); if (context->getSettingsRef().traverse_shadow_remote_data_paths) disk->getRemotePathsRecursive( "shadow", diff --git a/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh b/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh index 2905d7801ca..a1d4b9bba46 100755 --- a/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh +++ b/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh @@ -26,9 +26,4 @@ ${CLICKHOUSE_CLIENT} --query " FROM system.remote_data_paths WHERE disk_name = 's3_cache' AND local_path LIKE '%shadow/${BACKUP}%' SETTINGS traverse_shadow_remote_data_paths=1;" -${CLICKHOUSE_CLIENT} --query "SYSTEM UNFREEZE WITH NAME '${BACKUP}';" &>/dev/null || true -${CLICKHOUSE_CLIENT} --query " - SELECT count() == 0 - FROM system.remote_data_paths - WHERE disk_name = 's3_cache' AND local_path LIKE '%shadow/${BACKUP}%' - SETTINGS traverse_shadow_remote_data_paths=1;" +${CLICKHOUSE_CLIENT} --query "SYSTEM UNFREEZE WITH NAME '${BACKUP}';" &>/dev/null From 
df80c8c9f6ee0939cc6e6e05f3e951511a20f476 Mon Sep 17 00:00:00 2001 From: Aleksei Filatov Date: Tue, 5 Mar 2024 10:43:48 +0300 Subject: [PATCH 110/985] Update test reference --- .../03000_traverse_shadow_system_data_paths.reference | 1 - 1 file changed, 1 deletion(-) diff --git a/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.reference b/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.reference index e8183f05f5d..6ed281c757a 100644 --- a/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.reference +++ b/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.reference @@ -1,3 +1,2 @@ 1 1 -1 From e789d15948eaec3eaa9a8604e24d2f6ed7b60db5 Mon Sep 17 00:00:00 2001 From: taiyang-li <654010905@qq.com> Date: Tue, 5 Mar 2024 16:06:25 +0800 Subject: [PATCH 111/985] optimize insertmanyfrom of nullable(number) or nullable(string) --- src/Columns/ColumnDecimal.h | 7 +++++++ src/Columns/ColumnNullable.cpp | 8 ++++++++ src/Columns/ColumnNullable.h | 1 + src/Columns/ColumnString.cpp | 21 +++++++++++++++++++++ src/Columns/ColumnString.h | 2 ++ 5 files changed, 39 insertions(+) diff --git a/src/Columns/ColumnDecimal.h b/src/Columns/ColumnDecimal.h index 7ca01a8342c..e0ea26744dc 100644 --- a/src/Columns/ColumnDecimal.h +++ b/src/Columns/ColumnDecimal.h @@ -56,6 +56,13 @@ public: void shrinkToFit() override { data.shrink_to_fit(); } void insertFrom(const IColumn & src, size_t n) override { data.push_back(static_cast(src).getData()[n]); } + + void insertManyFrom(const IColumn & src, size_t position, size_t length) override + { + ValueType v = assert_cast(src).getData()[position]; + data.resize_fill(data.size() + length, v); + } + void insertData(const char * src, size_t /*length*/) override; void insertDefault() override { data.push_back(T()); } void insertManyDefaults(size_t length) override { data.resize_fill(data.size() + length); } diff --git a/src/Columns/ColumnNullable.cpp b/src/Columns/ColumnNullable.cpp index 1d11827ac97..fa5fdfb8c21 100644 --- a/src/Columns/ColumnNullable.cpp +++ b/src/Columns/ColumnNullable.cpp @@ -231,6 +231,14 @@ void ColumnNullable::insertFrom(const IColumn & src, size_t n) getNullMapData().push_back(src_concrete.getNullMapData()[n]); } + +void ColumnNullable::insertManyFrom(const IColumn & src, size_t position, size_t length) +{ + const ColumnNullable & src_concrete = assert_cast(src); + getNestedColumn().insertManyFrom(src_concrete.getNestedColumn(), position, length); + getNullMapColumn().insertManyFrom(src_concrete.getNullMapColumn(), position, length); +} + void ColumnNullable::insertFromNotNullable(const IColumn & src, size_t n) { getNestedColumn().insertFrom(src, n); diff --git a/src/Columns/ColumnNullable.h b/src/Columns/ColumnNullable.h index b4aef8e08fa..ef4bf4fa41b 100644 --- a/src/Columns/ColumnNullable.h +++ b/src/Columns/ColumnNullable.h @@ -69,6 +69,7 @@ public: void insert(const Field & x) override; bool tryInsert(const Field & x) override; void insertFrom(const IColumn & src, size_t n) override; + void insertManyFrom(const IColumn & src, size_t position, size_t length) override; void insertFromNotNullable(const IColumn & src, size_t n); void insertRangeFromNotNullable(const IColumn & src, size_t start, size_t length); diff --git a/src/Columns/ColumnString.cpp b/src/Columns/ColumnString.cpp index b9128372cea..f3c7ac1bf0c 100644 --- a/src/Columns/ColumnString.cpp +++ b/src/Columns/ColumnString.cpp @@ -38,6 +38,27 @@ ColumnString::ColumnString(const ColumnString & src) last_offset, chars.size()); } +void 
ColumnString::insertManyFrom(const IColumn & src, size_t position, size_t length) +{ + const ColumnString & src_concrete = assert_cast(src); + const UInt8 * src_buf = &src_concrete.chars[src_concrete.offsets[position - 1]]; + const size_t src_buf_size + = src_concrete.offsets[position] - src_concrete.offsets[position - 1]; /// -1th index is Ok, see PaddedPODArray. + + const size_t old_size = chars.size(); + const size_t new_size = old_size + src_buf_size * length; + chars.resize(new_size); + + const size_t old_rows = offsets.size(); + offsets.resize(old_rows + length); + + for (size_t current_offset = old_size; current_offset < new_size; current_offset += src_buf_size) + memcpySmallAllowReadWriteOverflow15(&chars[current_offset], src_buf, src_buf_size); + + for (size_t i = 0, current_offset = old_size + src_buf_size; i < length; ++i, current_offset += src_buf_size) + offsets[old_rows + i] = current_offset; +} + MutableColumnPtr ColumnString::cloneResized(size_t to_size) const { diff --git a/src/Columns/ColumnString.h b/src/Columns/ColumnString.h index 04aa1849187..2d1d69ced73 100644 --- a/src/Columns/ColumnString.h +++ b/src/Columns/ColumnString.h @@ -160,6 +160,8 @@ public: } } + void insertManyFrom(const IColumn & src, size_t position, size_t length) override; + void insertData(const char * pos, size_t length) override { const size_t old_size = chars.size(); From 47ad21dd257ff1a5751d191dfd311a7950a93111 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Tue, 5 Mar 2024 12:17:04 +0100 Subject: [PATCH 112/985] Remove extra empty line --- .../03002_map_array_functions_with_low_cardinality.sql | 1 - 1 file changed, 1 deletion(-) diff --git a/tests/queries/0_stateless/03002_map_array_functions_with_low_cardinality.sql b/tests/queries/0_stateless/03002_map_array_functions_with_low_cardinality.sql index 8240a8f93f5..8820a433da8 100644 --- a/tests/queries/0_stateless/03002_map_array_functions_with_low_cardinality.sql +++ b/tests/queries/0_stateless/03002_map_array_functions_with_low_cardinality.sql @@ -1,2 +1 @@ SELECT mapContainsKeyLike(map('aa', toLowCardinality(1), 'bb', toLowCardinality(2)), toLowCardinality('a%')); - From 580fd4ba080df6e29c59b785b1fca0eea76e649c Mon Sep 17 00:00:00 2001 From: Aleksei Filatov Date: Tue, 5 Mar 2024 10:43:48 +0300 Subject: [PATCH 113/985] Update test reference --- .../0_stateless/03000_traverse_shadow_system_data_paths.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh b/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh index a1d4b9bba46..98575540923 100755 --- a/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh +++ b/tests/queries/0_stateless/03000_traverse_shadow_system_data_paths.sh @@ -26,4 +26,4 @@ ${CLICKHOUSE_CLIENT} --query " FROM system.remote_data_paths WHERE disk_name = 's3_cache' AND local_path LIKE '%shadow/${BACKUP}%' SETTINGS traverse_shadow_remote_data_paths=1;" -${CLICKHOUSE_CLIENT} --query "SYSTEM UNFREEZE WITH NAME '${BACKUP}';" &>/dev/null +${CLICKHOUSE_CLIENT} --query "SYSTEM UNFREEZE WITH NAME '${BACKUP}';" &>/dev/null || true From a109952960acac12790cffde030062ec60208994 Mon Sep 17 00:00:00 2001 From: taiyang-li <654010905@qq.com> Date: Tue, 5 Mar 2024 22:08:36 +0800 Subject: [PATCH 114/985] dev columnstring --- src/Columns/ColumnArray.cpp | 83 +++++++++++++++++++++++++++++++ src/Columns/ColumnArray.h | 9 ++++ src/Columns/ColumnConst.h | 2 + 
src/Columns/ColumnFixedString.cpp | 14 ++++++ src/Columns/ColumnFixedString.h | 2 + 5 files changed, 110 insertions(+) diff --git a/src/Columns/ColumnArray.cpp b/src/Columns/ColumnArray.cpp index 7b268b80116..b620da81ae8 100644 --- a/src/Columns/ColumnArray.cpp +++ b/src/Columns/ColumnArray.cpp @@ -347,6 +347,89 @@ void ColumnArray::insertFrom(const IColumn & src_, size_t n) getOffsets().push_back(getOffsets().back() + size); } +template +void ColumnArray::insertManyFromNumber(const ColumnArray & src, size_t position, size_t length) +{ + using ColVecType = ColumnVectorOrDecimal; + size_t src_size = src.sizeAt(position); + size_t src_offset = src.offsetAt(position); + + const typename ColVecType::Container & src_data = typeid_cast(src.getData()).getData(); + typename ColVecType::Container & data_ref = typeid_cast(getData()).getData(); + size_t old_size = data_ref.size(); + size_t new_size = old_size + src_size * length; + data_ref.resize(new_size); + for (size_t i = 0, offset = old_size; i < length; ++i, offset += src_size) + memcpy(&data_ref[offset], &src_data[src_offset], src_size * sizeof(T)); +} + +void ColumnArray::insertManyFromString(const ColumnArray & src, size_t position, size_t length) +{ + size_t src_size = src.sizeAt(position); + size_t src_offset = src.offsetAt(position); + + const auto & src_string = typeid_cast(src.getData()); + const auto & src_chars = src_string.getChars(); + const auto & src_string_offsets = src_string.getOffsets(); + auto & dst_string = typeid_cast(getData()); + auto & dst_chars = dst_string.getChars(); + auto & dst_string_offsets = dst_string.getOffsets(); + + /// Each row may have multiple strings, copy them to dst_chars and update dst_offsets + size_t old_size = dst_string_offsets.size(); + size_t new_size = old_size + src_size * length; + dst_string_offsets.resize(new_size); + size_t dst_string_offset = dst_chars.size(); + for (size_t i = 0; i < length; ++i) + { + for (size_t j = 0; j < src_size; ++j) + { + size_t nested_offset = src_string_offsets[src_offset + j - 1]; + size_t nested_length = src_string_offsets[src_offset + j] - nested_offset; + + dst_string_offset += nested_length; + dst_string_offsets[old_size + i * src_size + j] = dst_string_offset; + } + } + + size_t chars_to_copy = src_string_offsets[src_offset + src_size - 1] - src_string_offsets[src_offset - 1]; + dst_chars.resize(dst_chars.size() + chars_to_copy * length); + for (size_t dst_offset = old_size; dst_offset < new_size; dst_offset += src_size) + memcpy(&dst_chars[dst_string_offsets[dst_offset - 1]], &src_chars[src_string_offsets[src_offset - 1]], chars_to_copy); +} + +void ColumnArray::insertManyFromTuple(const ColumnArray & src, size_t position, size_t length) +{ + +} +void ColumnArray::insertManyFromNullable(const ColumnArray & src, size_t position, size_t length) +{ + +} +void ColumnArray::insertManyFromGeneric(const ColumnArray & src, size_t position, size_t length) +{ + size_t src_size = src.sizeAt(position); + size_t src_offset = src.offsetAt(position); + const auto & src_data = src.getData(); + size_t new_size = data->size() + src_size * length; + data->reserve(new_size); + for (size_t i = 0; i < length; ++i) + data->insertRangeFrom(src_data, src_offset, src_size); +} + +void ColumnArray::insertManyFrom(const IColumn & src_, size_t position, size_t length) +{ + /// First fill offsets + const ColumnArray & src = assert_cast(src_); + size_t src_size = src.sizeAt(position); + auto & offsets_ref = getOffsets(); + size_t old_rows = offsets_ref.size(); + size_t new_rows = 
old_rows + length; + size_t old_size = offsets_ref.back(); + offsets_ref.resize(new_rows); + for (size_t i = 0, offset = old_size + src_size; i < length; ++i, offset += src_size) + offsets_ref[old_rows + i] = offset; +} void ColumnArray::insertDefault() { diff --git a/src/Columns/ColumnArray.h b/src/Columns/ColumnArray.h index 230d8830265..73d632a38b9 100644 --- a/src/Columns/ColumnArray.h +++ b/src/Columns/ColumnArray.h @@ -88,6 +88,7 @@ public: void insert(const Field & x) override; bool tryInsert(const Field & x) override; void insertFrom(const IColumn & src_, size_t n) override; + void insertManyFrom(const IColumn & src, size_t position, size_t length) override; void insertDefault() override; void popBack(size_t n) override; ColumnPtr filter(const Filter & filt, ssize_t result_size_hint) const override; @@ -213,6 +214,14 @@ private: ColumnPtr filterNullable(const Filter & filt, ssize_t result_size_hint) const; ColumnPtr filterGeneric(const Filter & filt, ssize_t result_size_hint) const; + /// Specializations for insertManyFrom + template + void insertManyFromNumber(const ColumnArray & src, size_t position, size_t length); + void insertManyFromString(const ColumnArray & src, size_t position, size_t length); + void insertManyFromTuple(const ColumnArray & src, size_t position, size_t length); + void insertManyFromNullable(const ColumnArray & src, size_t position, size_t length); + void insertManyFromGeneric(const ColumnArray & src, size_t position, size_t length); + int compareAtImpl(size_t n, size_t m, const IColumn & rhs_, int nan_direction_hint, const Collator * collator=nullptr) const; }; diff --git a/src/Columns/ColumnConst.h b/src/Columns/ColumnConst.h index 990b7189fa3..4a3d40ca0d2 100644 --- a/src/Columns/ColumnConst.h +++ b/src/Columns/ColumnConst.h @@ -150,6 +150,8 @@ public: ++s; } + void insertManyFrom(const IColumn & /*src*/, size_t /* position */, size_t length) override { s += length; } + void insertDefault() override { ++s; diff --git a/src/Columns/ColumnFixedString.cpp b/src/Columns/ColumnFixedString.cpp index e460c84d696..b55f68d4687 100644 --- a/src/Columns/ColumnFixedString.cpp +++ b/src/Columns/ColumnFixedString.cpp @@ -85,6 +85,20 @@ void ColumnFixedString::insertFrom(const IColumn & src_, size_t index) memcpySmallAllowReadWriteOverflow15(chars.data() + old_size, &src.chars[n * index], n); } +void ColumnFixedString::insertManyFrom(const IColumn & src, size_t position, size_t length) +{ + const ColumnFixedString & src_concrete = assert_cast(src); + if (n != src_concrete.getN()) + throw Exception(ErrorCodes::SIZE_OF_FIXED_STRING_DOESNT_MATCH, "Size of FixedString doesn't match"); + + const size_t old_size = chars.size(); + const size_t new_size = old_size + n * length; + chars.resize(new_size); + + for (size_t offset = old_size; offset < new_size; offset += n) + memcpySmallAllowReadWriteOverflow15(&chars[offset], &src_concrete.chars[n * position], n); +} + void ColumnFixedString::insertData(const char * pos, size_t length) { if (length > n) diff --git a/src/Columns/ColumnFixedString.h b/src/Columns/ColumnFixedString.h index f40e1356b27..56d42e8b34e 100644 --- a/src/Columns/ColumnFixedString.h +++ b/src/Columns/ColumnFixedString.h @@ -100,6 +100,8 @@ public: void insertFrom(const IColumn & src_, size_t index) override; + void insertManyFrom(const IColumn & src, size_t position, size_t length) override; + void insertData(const char * pos, size_t length) override; void insertDefault() override From bfb703b579fa192dc58e51ea842067e7e379e949 Mon Sep 17 00:00:00 2001 From: 
Blargian Date: Tue, 5 Mar 2024 15:38:42 +0100 Subject: [PATCH 115/985] Add mortonEncode and mortonDecode to documentation --- .../functions/encoding-functions.md | 203 ++++++++++++++++++ 1 file changed, 203 insertions(+) diff --git a/docs/en/sql-reference/functions/encoding-functions.md b/docs/en/sql-reference/functions/encoding-functions.md index 618dd3f4b4f..7fd77ce3a6a 100644 --- a/docs/en/sql-reference/functions/encoding-functions.md +++ b/docs/en/sql-reference/functions/encoding-functions.md @@ -433,3 +433,206 @@ Result: │ [0,1,2,3,4,5,6,7] │ └───────────────────┘ ``` + +## mortonEncode + +Calculates the Morton encoding (ZCurve) for a list of unsigned integers. + +The function has two modes of operation: +- Simple +- Expanded + +### Simple mode + +Accepts up to 8 unsigned integers as arguments and produces a UInt64 code. + +**Syntax** + +```sql +mortonEncode(args) +``` + +**Parameters** + +- `args`: up to 8 [unsigned integers](../../sql-reference/data-types/int-uint.md) or columns of the aforementioned type. + +**Returned value** + +- A UInt64 code + +Type: [UInt64](../../sql-reference/data-types/int-uint.md) + +**Example** + +Query: + +```sql +SELECT mortonEncode(1, 2, 3); +``` + +```response +53 +``` + +### Expanded mode + +Accepts a range mask ([tuple](../../sql-reference/data-types/tuple.md)) as a first argument and up to 8 [unsigned integers](../../sql-reference/data-types/int-uint.md) as other arguments. + +Each number in the mask configures the amount of range expansion: +1 - no expansion +2 - 2x expansion +3 - 3x expansion +... +Up to 8x expansion. + +**Syntax** + +```sql +mortonEncode(range_mask, args) +``` + +**Parameters** +- `range_mask`: 1-8. +- `args`: up to 8 [unsigned integers](../../sql-reference/data-types/int-uint.md) or columns of the aforementioned type. + +Note: when using columns for `args` the provided `range_mask` tuple should still be a constant. + +**Returned value** + +- A UInt64 code + +Type: [UInt64](../../sql-reference/data-types/int-uint.md) + + +**Example** + +Range expansion can be beneficial when you need a similar distribution for arguments with wildly different ranges (or cardinality) +For example: 'IP Address' (0...FFFFFFFF) and 'Country code' (0...FF). + +Query: + +```sql +SELECT mortonEncode((1,2), 1024, 16); +``` + +```response +1572864 +``` + +Note: tuple size must be equal to the number of the other arguments. + +**Example** + +Morton encoding for one argument is always the argument itself: + +Query: + +```sql +SELECT mortonEncode(1); +``` + +```response +1 +``` + +**Example** + +It is also possible to expand one argument too: + +Query: + +```sql +SELECT mortonEncode(tuple(2), 128); +``` + +```response +32768 +``` + +**implementation details** + +Please note that you can fit only so much bits of information into Morton code as [UInt64](../../sql-reference/data-types/int-uint.md) has. Two arguments will have a range of maximum 2^32 (64/2) each, three arguments a range of max 2^21 (64/3) each and so on. All overflow will be clamped to zero. + +## mortonDecode + +Decodes a Morton encoding (ZCurve) into the corresponding unsigned integer tuple. + +As with the `mortonEncode` function, this function has two modes of operation: +- Simple +- Expanded + +### Simple mode + +Accepts a resulting tuple size as the first argument and the code as the second argument. + +**Syntax** + +```sql +mortonDecode(tuple_size, code) +``` + +**Parameters** +- `tuple_size`: integer value no more than 8. 
+- `code`: [UInt64](../../sql-reference/data-types/int-uint.md) code. + +**Returned value** + +- [tuple](../../sql-reference/data-types/tuple.md) of the specified size. + +Type: [UInt64](../../sql-reference/data-types/int-uint.md) + +**Example** + +Query: + +```sql +SELECT mortonDecode(3, 53); +``` + +```response +["1","2","3"] +``` + +### Expanded mode + +Accepts a range mask (tuple) as a first argument and the code as the second argument. +Each number in the mask configures the amount of range shrink +1 - no shrink +2 - 2x shrink +3 - 3x shrink +... +Up to 8x shrink. + +Range expansion can be beneficial when you need a similar distribution for arguments with wildly different ranges (or cardinality) +For example: 'IP Address' (0...FFFFFFFF) and 'Country code' (0...FF). +As with the encode function, this is limited to 8 numbers at most. + +**Example** + +Query: + +```sql +SELECT mortonDecode(1, 1); +``` + +```response +["1"] +``` + +**Example** + +It is also possible to shrink one argument: + +Query: + +```sql +SELECT mortonDecode(tuple(2), 32768); +``` + +```response +["128"] +``` + + + + From 7930a26df136c8a2e10f839ea4738a338dbb6c9e Mon Sep 17 00:00:00 2001 From: Blargian Date: Tue, 5 Mar 2024 15:47:45 +0100 Subject: [PATCH 116/985] Fix formatting of compression/expansion levels --- .../functions/encoding-functions.md | 24 +++++++++---------- 1 file changed, 12 insertions(+), 12 deletions(-) diff --git a/docs/en/sql-reference/functions/encoding-functions.md b/docs/en/sql-reference/functions/encoding-functions.md index 7fd77ce3a6a..0cb459b8e07 100644 --- a/docs/en/sql-reference/functions/encoding-functions.md +++ b/docs/en/sql-reference/functions/encoding-functions.md @@ -478,12 +478,12 @@ SELECT mortonEncode(1, 2, 3); Accepts a range mask ([tuple](../../sql-reference/data-types/tuple.md)) as a first argument and up to 8 [unsigned integers](../../sql-reference/data-types/int-uint.md) as other arguments. -Each number in the mask configures the amount of range expansion: -1 - no expansion -2 - 2x expansion -3 - 3x expansion -... -Up to 8x expansion. +Each number in the mask configures the amount of range expansion:
+1 - no expansion<br/>
+2 - 2x expansion<br/>
+3 - 3x expansion<br/>
+...<br/>
+Up to 8x expansion.<br/>
**Syntax** @@ -596,12 +596,12 @@ SELECT mortonDecode(3, 53); ### Expanded mode Accepts a range mask (tuple) as a first argument and the code as the second argument. -Each number in the mask configures the amount of range shrink -1 - no shrink -2 - 2x shrink -3 - 3x shrink -... -Up to 8x shrink. +Each number in the mask configures the amount of range shrink:
+1 - no shrink<br/>
+2 - 2x shrink<br/>
+3 - 3x shrink<br/>
+...<br/>
+Up to 8x shrink.<br/>
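+
+For instance, decoding the expanded-mode encode example from above (`mortonEncode((1,2), 1024, 16)` returned 1572864) with the same range mask should give back the original values:
+
+```sql
+SELECT mortonDecode((1,2), 1572864);
+```
+
+```response
+["1024","16"]
+```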
Range expansion can be beneficial when you need a similar distribution for arguments with wildly different ranges (or cardinality) For example: 'IP Address' (0...FFFFFFFF) and 'Country code' (0...FF). From 45509607ad139c099c5a4d5fea07ac34149dcf2d Mon Sep 17 00:00:00 2001 From: Blargian Date: Tue, 5 Mar 2024 15:50:30 +0100 Subject: [PATCH 117/985] Fix spelling mistake --- docs/en/sql-reference/functions/encoding-functions.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/en/sql-reference/functions/encoding-functions.md b/docs/en/sql-reference/functions/encoding-functions.md index 0cb459b8e07..28431c84add 100644 --- a/docs/en/sql-reference/functions/encoding-functions.md +++ b/docs/en/sql-reference/functions/encoding-functions.md @@ -551,7 +551,7 @@ SELECT mortonEncode(tuple(2), 128); **implementation details** -Please note that you can fit only so much bits of information into Morton code as [UInt64](../../sql-reference/data-types/int-uint.md) has. Two arguments will have a range of maximum 2^32 (64/2) each, three arguments a range of max 2^21 (64/3) each and so on. All overflow will be clamped to zero. +Please note that you can fit only so many bits of information into Morton code as [UInt64](../../sql-reference/data-types/int-uint.md) has. Two arguments will have a range of maximum 2^32 (64/2) each, three arguments a range of max 2^21 (64/3) each and so on. All overflow will be clamped to zero. ## mortonDecode From aa6b70e5f2187be71b6bce835ecff0aa0c0bfca7 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?= Date: Tue, 5 Mar 2024 16:55:08 +0000 Subject: [PATCH 118/985] Add documentation to `simpleJSON` functions --- .../sql-reference/functions/json-functions.md | 392 +++++++++++++++--- 1 file changed, 342 insertions(+), 50 deletions(-) diff --git a/docs/en/sql-reference/functions/json-functions.md b/docs/en/sql-reference/functions/json-functions.md index 2c837ff4a42..246cb8972fb 100644 --- a/docs/en/sql-reference/functions/json-functions.md +++ b/docs/en/sql-reference/functions/json-functions.md @@ -5,80 +5,372 @@ sidebar_label: JSON --- There are two sets of functions to parse JSON. - - `visitParam*` (`simpleJSON*`) is made to parse a special very limited subset of a JSON, but these functions are extremely fast. + - `simpleJSON*` (`visitParam*`) is made to parse a special very limited subset of a JSON, but these functions are extremely fast. - `JSONExtract*` is made to parse normal JSON. -# visitParam functions +# simpleJSON/visitParam functions ClickHouse has special functions for working with simplified JSON. All these JSON functions are based on strong assumptions about what the JSON can be, but they try to do as little as possible to get the job done. The following assumptions are made: 1. The field name (function argument) must be a constant. -2. The field name is somehow canonically encoded in JSON. For example: `visitParamHas('{"abc":"def"}', 'abc') = 1`, but `visitParamHas('{"\\u0061\\u0062\\u0063":"def"}', 'abc') = 0` +2. The field name is somehow canonically encoded in JSON. For example: `simpleJSONHas('{"abc":"def"}', 'abc') = 1`, but `simpleJSONHas('{"\\u0061\\u0062\\u0063":"def"}', 'abc') = 0` 3. Fields are searched for on any nesting level, indiscriminately. If there are multiple matching fields, the first occurrence is used. 4. The JSON does not have space characters outside of string literals. -## visitParamHas(params, name) +## simpleJSONHas -Checks whether there is a field with the `name` name. 
+Checks whether there is a field named `field_name`. The result is `UInt8`. -Alias: `simpleJSONHas`. +**Syntax** -## visitParamExtractUInt(params, name) - -Parses UInt64 from the value of the field named `name`. If this is a string field, it tries to parse a number from the beginning of the string. If the field does not exist, or it exists but does not contain a number, it returns 0. - -Alias: `simpleJSONExtractUInt`. - -## visitParamExtractInt(params, name) - -The same as for Int64. - -Alias: `simpleJSONExtractInt`. - -## visitParamExtractFloat(params, name) - -The same as for Float64. - -Alias: `simpleJSONExtractFloat`. - -## visitParamExtractBool(params, name) - -Parses a true/false value. The result is UInt8. - -Alias: `simpleJSONExtractBool`. - -## visitParamExtractRaw(params, name) - -Returns the value of a field, including separators. - -Alias: `simpleJSONExtractRaw`. - -Examples: - -``` sql -visitParamExtractRaw('{"abc":"\\n\\u0000"}', 'abc') = '"\\n\\u0000"'; -visitParamExtractRaw('{"abc":{"def":[1,2,3]}}', 'abc') = '{"def":[1,2,3]}'; +```sql +simpleJSONHas(json, field_name) ``` -## visitParamExtractString(params, name) +**Parameters** -Parses the string in double quotes. The value is unescaped. If unescaping failed, it returns an empty string. +- `json`: The JSON in which the field is searched for. [String](../../sql-reference/data-types/string.md#string) +- `field_name`: The name of the field to search for. [String literal](../syntax#string) -Alias: `simpleJSONExtractString`. +**Returned value** -Examples: +It returns `1` if the field exists, `0` otherwise. -``` sql -visitParamExtractString('{"abc":"\\n\\u0000"}', 'abc') = '\n\0'; -visitParamExtractString('{"abc":"\\u263a"}', 'abc') = '☺'; -visitParamExtractString('{"abc":"\\u263"}', 'abc') = ''; -visitParamExtractString('{"abc":"hello}', 'abc') = ''; +**Example** + +Query: + +```sql +CREATE TABLE jsons +( + `json` String +) +ENGINE = Memory; + +INSERT INTO jsons VALUES ('{"foo":"true","qux":1}'); + +SELECT simpleJSONHas(json, 'foo') FROM jsons; +SELECT simpleJSONHas(json, 'bar') FROM jsons; ``` +```response +1 +0 +``` +## simpleJSONExtractUInt + +Parses `UInt64` from the value of the field named `field_name`. If this is a string field, it tries to parse a number from the beginning of the string. If the field does not exist, or it exists but does not contain a number, it returns `0`. + +**Syntax** + +```sql +simpleJSONExtractUInt(json, field_name) +``` + +**Parameters** + +- `json`: The JSON in which the field is searched for. [String](../../sql-reference/data-types/string.md#string) +- `field_name`: The name of the field to search for. [String literal](../syntax#string) + +**Returned value** + +It returns the number parsed from the field if the field exists and contains a number, `0` otherwise. + +**Example** + +Query: + +```sql +CREATE TABLE jsons +( + `json` String +) +ENGINE = Memory; + +INSERT INTO jsons VALUES ('{"foo":"4e3"}'); +INSERT INTO jsons VALUES ('{"foo":3.4}'); +INSERT INTO jsons VALUES ('{"foo":5}'); +INSERT INTO jsons VALUES ('{"foo":"not1number"}'); +INSERT INTO jsons VALUES ('{"baz":2}'); + +SELECT simpleJSONExtractUInt(json, 'foo') FROM jsons ORDER BY json; +``` + +```response +0 +4 +0 +3 +5 +``` + +## simpleJSONExtractInt + +Parses `Int64` from the value of the field named `field_name`. If this is a string field, it tries to parse a number from the beginning of the string. If the field does not exist, or it exists but does not contain a number, it returns `0`. 
+ +**Syntax** + +```sql +simpleJSONExtractInt(json, field_name) +``` + +**Parameters** + +- `json`: The JSON in which the field is searched for. [String](../../sql-reference/data-types/string.md#string) +- `field_name`: The name of the field to search for. [String literal](../syntax#string) + +**Returned value** + +It returns the number parsed from the field if the field exists and contains a number, `0` otherwise. + +**Example** + +Query: + +```sql +CREATE TABLE jsons +( + `json` String +) +ENGINE = Memory; + +INSERT INTO jsons VALUES ('{"foo":"-4e3"}'); +INSERT INTO jsons VALUES ('{"foo":-3.4}'); +INSERT INTO jsons VALUES ('{"foo":5}'); +INSERT INTO jsons VALUES ('{"foo":"not1number"}'); +INSERT INTO jsons VALUES ('{"baz":2}'); + +SELECT simpleJSONExtractInt(json, 'foo') FROM jsons ORDER BY json; +``` + +```response +0 +-4 +0 +-3 +5 +``` + +## simpleJSONExtractFloat + +Parses `Float64` from the value of the field named `field_name`. If this is a string field, it tries to parse a number from the beginning of the string. If the field does not exist, or it exists but does not contain a number, it returns `0`. + +**Syntax** + +```sql +simpleJSONExtractFloat(json, field_name) +``` + +**Parameters** + +- `json`: The JSON in which the field is searched for. [String](../../sql-reference/data-types/string.md#string) +- `field_name`: The name of the field to search for. [String literal](../syntax#string) + +**Returned value** + +It returns the number parsed from the field if the field exists and contains a number, `0` otherwise. + +**Example** + +Query: + +```sql +CREATE TABLE jsons +( + `json` String +) +ENGINE = Memory; + +INSERT INTO jsons VALUES ('{"foo":"-4e3"}'); +INSERT INTO jsons VALUES ('{"foo":-3.4}'); +INSERT INTO jsons VALUES ('{"foo":5}'); +INSERT INTO jsons VALUES ('{"foo":"not1number"}'); +INSERT INTO jsons VALUES ('{"baz":2}'); + +SELECT simpleJSONExtractFloat(json, 'foo') FROM jsons ORDER BY json; +``` + +```response +0 +-4000 +0 +-3.4 +5 +``` + +## simpleJSONExtractBool + +Parses a true/false value from the value of the field named `field_name`. The result is `UInt8`. + +**Syntax** + +```sql +simpleJSONExtractBool(json, field_name) +``` + +**Parameters** + +- `json`: The JSON in which the field is searched for. [String](../../sql-reference/data-types/string.md#string) +- `field_name`: The name of the field to search for. [String literal](../syntax#string) + +**Returned value** + +It returns `1` if the value of the field is `true`, `0` otherwise. This means this function will return `0` including (and not only) in the following cases: + - If the field doesn't exists. + - If the field contains `true` as a string, e.g.: `{"field":"true"}`. + - If the field contains `1` as a numerical value. + +**Example** + +Query: + +```sql +CREATE TABLE jsons +( + `json` String +) +ENGINE = Memory; + +INSERT INTO jsons VALUES ('{"foo":false,"bar":true}'); +INSERT INTO jsons VALUES ('{"foo":"true","qux":1}'); + +SELECT simpleJSONExtractBool(json, 'bar') FROM jsons ORDER BY json; +SELECT simpleJSONExtractBool(json, 'foo') FROM jsons ORDER BY json; +``` + +```response +0 +1 +0 +0 +``` + +## simpleJSONExtractRaw + +Returns the value of the field named `field_name` as a `String`, including separators. + +**Syntax** + +```sql +simpleJSONExtractRaw(json, field_name) +``` + +**Parameters** + +- `json`: The JSON in which the field is searched for. [String](../../sql-reference/data-types/string.md#string) +- `field_name`: The name of the field to search for. 
[String literal](../syntax#string) + +**Returned value** + +It returns the value of the field as a [`String`](../../sql-reference/data-types/string.md#string), including separators if the field exists, or an emtpy `String` otherwise. + +**Example** + +Query: + +```sql +CREATE TABLE jsons +( + `json` String +) +ENGINE = Memory; + +INSERT INTO jsons VALUES ('{"foo":"-4e3"}'); +INSERT INTO jsons VALUES ('{"foo":-3.4}'); +INSERT INTO jsons VALUES ('{"foo":5}'); +INSERT INTO jsons VALUES ('{"foo":{"def":[1,2,3]}}'); +INSERT INTO jsons VALUES ('{"baz":2}'); + +SELECT simpleJSONExtractRaw(json, 'foo') FROM jsons ORDER BY json; +``` + +```response + +"-4e3" +-3.4 +5 +{"def":[1,2,3]} +``` + +## simpleJSONExtractString + +Parses `String` in double quotes from the value of the field named `field_name`. + +**Syntax** + +```sql +simpleJSONExtractString(json, field_name) +``` + +**Parameters** + +- `json`: The JSON in which the field is searched for. [String](../../sql-reference/data-types/string.md#string) +- `field_name`: The name of the field to search for. [String literal](../syntax#string) + +**Returned value** + +It returns the value of a field as a [`String`](../../sql-reference/data-types/string.md#string), including separators. The value is unescaped. It returns an empty `String`: if the field doesn't contain a double quoted string, if unescaping fails or if the field doesn't exist. + +**Implementation details** + There is currently no support for code points in the format `\uXXXX\uYYYY` that are not from the basic multilingual plane (they are converted to CESU-8 instead of UTF-8). +**Example** + +Query: + +```sql +CREATE TABLE jsons +( + `json` String +) +ENGINE = Memory; + +INSERT INTO jsons VALUES ('{"foo":"\\n\\u0000"}'); +INSERT INTO jsons VALUES ('{"foo":"\\u263"}'); +INSERT INTO jsons VALUES ('{"foo":"\\u263a"}'); +INSERT INTO jsons VALUES ('{"foo":"hello}'); + +SELECT simpleJSONExtractString(json, 'foo') FROM jsons ORDER BY json; +``` + +```response +\n\0 + +☺ + +``` + +## visitParamHas + +This function is [an alias of `simpleJSONHas`](./json-functions#simplejsonhas). + +## visitParamExtractUInt + +This function is [an alias of `simpleJSONExtractUInt`](./json-functions#simplejsonextractuint). + +## visitParamExtractInt + +This function is [an alias of `simpleJSONExtractInt`](./json-functions#simplejsonextractint). + +## visitParamExtractFloat + +This function is [an alias of `simpleJSONExtractFloat`](./json-functions#simplejsonextractfloat). + +## visitParamExtractBool + +This function is [an alias of `simpleJSONExtractBool`](./json-functions#simplejsonextractbool). + +## visitParamExtractRaw + +This function is [an alias of `simpleJSONExtractRaw`](./json-functions#simplejsonextractraw). + +## visitParamExtractString + +This function is [an alias of `simpleJSONExtractString`](./json-functions#simplejsonextractstring). + # JSONExtract functions The following functions are based on [simdjson](https://github.com/lemire/simdjson) designed for more complex JSON parsing requirements. From 981c507d8007a4f7761a83a2ecfa0956a364317d Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?= Date: Tue, 5 Mar 2024 17:01:54 +0000 Subject: [PATCH 119/985] Add example to `sin`. 
--- docs/en/sql-reference/functions/math-functions.md | 12 ++++++++++++ 1 file changed, 12 insertions(+) diff --git a/docs/en/sql-reference/functions/math-functions.md b/docs/en/sql-reference/functions/math-functions.md index b27668caf0c..fc659891b5c 100644 --- a/docs/en/sql-reference/functions/math-functions.md +++ b/docs/en/sql-reference/functions/math-functions.md @@ -299,6 +299,18 @@ sin(x) Type: [Float*](../../sql-reference/data-types/float.md). +**Example** + +Query: + +```sql +SELECT sin(1.23); +``` + +```response +0.9424888019316975 +``` + ## cos Returns the cosine of the argument. From 57670a69be7aee37141aad13c3c9509ea2a40162 Mon Sep 17 00:00:00 2001 From: Shaun Struwig <41984034+Blargian@users.noreply.github.com> Date: Wed, 6 Mar 2024 04:15:57 +0100 Subject: [PATCH 120/985] Add mortonEncode, mortonDecode and related to spelling exceptions --- utils/check-style/aspell-ignore/en/aspell-dict.txt | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/utils/check-style/aspell-ignore/en/aspell-dict.txt b/utils/check-style/aspell-ignore/en/aspell-dict.txt index f61448b2f35..6257b2fcd95 100644 --- a/utils/check-style/aspell-ignore/en/aspell-dict.txt +++ b/utils/check-style/aspell-ignore/en/aspell-dict.txt @@ -260,6 +260,7 @@ ExactEdgeLengthRads ExecutablePool ExtType ExternalDistributed +FFFFFFFF FFFD FIPS FOSDEM @@ -546,6 +547,8 @@ MinIO MinMax MindsDB Mongodb +mortonDecode +mortonEncode MsgPack MultiPolygon Multiline @@ -2741,6 +2744,7 @@ xz yaml yandex youtube +ZCurve zLib zLinux zabbix From 53c9d4513c4b93ed79df305bb5c36c0cfb43ef79 Mon Sep 17 00:00:00 2001 From: taiyang-li <654010905@qq.com> Date: Wed, 6 Mar 2024 12:16:17 +0800 Subject: [PATCH 121/985] finish dev column array --- src/Columns/ColumnArray.cpp | 132 +++++++++++++++++++++++++++++++++--- src/Columns/ColumnArray.h | 3 + 2 files changed, 125 insertions(+), 10 deletions(-) diff --git a/src/Columns/ColumnArray.cpp b/src/Columns/ColumnArray.cpp index b620da81ae8..aa0d5aa3e50 100644 --- a/src/Columns/ColumnArray.cpp +++ b/src/Columns/ColumnArray.cpp @@ -31,6 +31,7 @@ namespace ErrorCodes extern const int SIZES_OF_COLUMNS_DOESNT_MATCH; extern const int LOGICAL_ERROR; extern const int TOO_LARGE_ARRAY_SIZE; + extern const int ILLEGAL_COLUMN; } /** Obtaining array as Field can be slow for large arrays and consume vast amount of memory. @@ -363,6 +364,19 @@ void ColumnArray::insertManyFromNumber(const ColumnArray & src, size_t position, memcpy(&data_ref[offset], &src_data[src_offset], src_size * sizeof(T)); } +void ColumnArray::insertManyFromConst(const ColumnConst & src, size_t position, size_t length) +{ + const ColumnArray * src_array = typeid_cast(&src.getDataColumn()); + if (!src_array) + throw Exception( + ErrorCodes::ILLEGAL_COLUMN, + "Cannot insert from const column of type {} to column of type {}", + src.getDataColumn().getName(), + getName()); + + insertManyFromImpl(*src_array, 0, length, true); +} + void ColumnArray::insertManyFromString(const ColumnArray & src, size_t position, size_t length) { size_t src_size = src.sizeAt(position); @@ -400,12 +414,53 @@ void ColumnArray::insertManyFromString(const ColumnArray & src, size_t position, void ColumnArray::insertManyFromTuple(const ColumnArray & src, size_t position, size_t length) { + ColumnTuple & tuple = assert_cast(getData()); + const ColumnTuple & src_tuple = assert_cast(src.getData()); + /// Make temporary arrays for each components of Tuple. In the same way as for Nullable. 
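+    /// Note: each temporary array below shares this column's offsets, and the nested
+    /// insertManyFromImpl calls pass update_offsets = false, so the offsets are written only
+    /// once by the outer call while only the per-component data is appended here.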
+ size_t tuple_size = tuple.tupleSize(); + size_t src_tuple_size = src_tuple.tupleSize(); + if (tuple_size == 0) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Empty tuple"); + if (tuple_size != src_tuple_size) + throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Nested tuple size mismatch: {} vs {}", tuple_size, src_tuple_size); + + Columns temporary_arrays(tuple_size); + Columns src_temporary_arrays(tuple_size); + for (size_t i = 0; i < tuple_size; ++i) + { + temporary_arrays[i] = ColumnArray::create(tuple.getColumn(i).assumeMutable(), getOffsetsPtr()->assumeMutable()); + src_temporary_arrays[i] = ColumnArray::create(src_tuple.getColumn(i).assumeMutable(), src.getOffsetsPtr()->assumeMutable()); + assert_cast(*temporary_arrays[i]) + .insertManyFromImpl(assert_cast(*src_temporary_arrays[i]), position, length, false); + } + + Columns tuple_columns(tuple_size); + for (size_t i = 0; i < tuple_size; ++i) + tuple_columns[i] = assert_cast(*temporary_arrays[i]).getDataPtr(); + + getDataPtr() = ColumnTuple::create(std::move(tuple_columns)); } + void ColumnArray::insertManyFromNullable(const ColumnArray & src, size_t position, size_t length) { + ColumnNullable & nullable = assert_cast(getData()); + const ColumnNullable & src_nullable = assert_cast(src.getData()); + /// Process nested column without updating array offsets + auto array_of_nested = ColumnArray(nullable.getNestedColumnPtr()->assumeMutable(), getOffsetsPtr()->assumeMutable()); + auto src_array_of_nested = ColumnArray(src_nullable.getNestedColumnPtr()->assumeMutable(), src.getOffsetsPtr()->assumeMutable()); + array_of_nested.insertManyFromImpl(src_array_of_nested, position, length, false); + + /// Process null map column without updating array offsets + auto array_of_null_map = ColumnArray(nullable.getNullMapColumnPtr()->assumeMutable(), getOffsetsPtr()->assumeMutable()); + auto src_array_of_null_map = ColumnArray(src_nullable.getNullMapColumnPtr()->assumeMutable(), src.getOffsetsPtr()->assumeMutable()); + array_of_null_map.insertManyFromImpl(src_array_of_null_map, position, length, false); + + /// Update array data + getDataPtr() = ColumnNullable::create(array_of_nested.getDataPtr(), array_of_null_map.getDataPtr()); } + void ColumnArray::insertManyFromGeneric(const ColumnArray & src, size_t position, size_t length) { size_t src_size = src.sizeAt(position); @@ -419,16 +474,73 @@ void ColumnArray::insertManyFromGeneric(const ColumnArray & src, size_t position void ColumnArray::insertManyFrom(const IColumn & src_, size_t position, size_t length) { - /// First fill offsets - const ColumnArray & src = assert_cast(src_); - size_t src_size = src.sizeAt(position); - auto & offsets_ref = getOffsets(); - size_t old_rows = offsets_ref.size(); - size_t new_rows = old_rows + length; - size_t old_size = offsets_ref.back(); - offsets_ref.resize(new_rows); - for (size_t i = 0, offset = old_size + src_size; i < length; ++i, offset += src_size) - offsets_ref[old_rows + i] = offset; + const ColumnConst * src_const = typeid_cast(&src_); + if (src_const) + return insertManyFromConst(*src_const, position, length); + + const ColumnArray * src_array = typeid_cast(&src_); + if (!src_array) + throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Cannot insert from column of type {} to column of type {}", src_.getName(), getName()); + + return insertManyFromImpl(*src_array, position, length, true); +} + +void ColumnArray::insertManyFromImpl(const ColumnArray & src, size_t position, size_t length, bool update_offsets) +{ + /// First fill offsets if needed + if (update_offsets) + 
{ + size_t src_size = src.sizeAt(position); + auto & offsets_ref = getOffsets(); + size_t old_rows = offsets_ref.size(); + size_t new_rows = old_rows + length; + size_t old_size = offsets_ref.back(); + offsets_ref.resize(new_rows); + for (size_t i = 0, offset = old_size + src_size; i < length; ++i, offset += src_size) + offsets_ref[old_rows + i] = offset; + } + + if (typeid_cast(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast *>(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast *>(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast *>(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast *>(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast *>(data.get())) + return insertManyFromNumber(src, position, length); + if (typeid_cast(data.get())) + return insertManyFromNullable(src, position, length); + if (typeid_cast(data.get())) + return insertManyFromTuple(src, position, length); + return insertManyFromGeneric(src, position, length); } void ColumnArray::insertDefault() diff --git a/src/Columns/ColumnArray.h b/src/Columns/ColumnArray.h index 73d632a38b9..765f86ec552 100644 --- a/src/Columns/ColumnArray.h +++ b/src/Columns/ColumnArray.h @@ -215,6 +215,9 @@ private: ColumnPtr filterGeneric(const Filter & filt, ssize_t result_size_hint) const; /// Specializations for insertManyFrom + void insertManyFromConst(const ColumnConst & src, size_t position, size_t length); + void insertManyFromImpl(const ColumnArray & src, size_t position, size_t length, bool update_offsets = true); + template void insertManyFromNumber(const ColumnArray & src, size_t position, size_t length); void insertManyFromString(const ColumnArray & src, size_t position, size_t length); From 3bf3c7cc708d1a564896d649a1a804b868f89d8d Mon Sep 17 00:00:00 2001 From: taiyang-li <654010905@qq.com> Date: Wed, 6 Mar 2024 12:32:23 +0800 Subject: [PATCH 122/985] finish column map and tuple --- src/Columns/ColumnArray.cpp | 2 +- src/Columns/ColumnMap.cpp | 5 +++++ src/Columns/ColumnMap.h | 1 + src/Columns/ColumnTuple.cpp | 12 ++++++++++++ src/Columns/ColumnTuple.h | 1 + 5 files changed, 20 insertions(+), 1 deletion(-) diff --git a/src/Columns/ColumnArray.cpp b/src/Columns/ColumnArray.cpp index aa0d5aa3e50..5b0df8e9b6b 100644 --- a/src/Columns/ColumnArray.cpp +++ b/src/Columns/ColumnArray.cpp @@ -364,7 +364,7 @@ void ColumnArray::insertManyFromNumber(const ColumnArray & src, 
size_t position, memcpy(&data_ref[offset], &src_data[src_offset], src_size * sizeof(T)); } -void ColumnArray::insertManyFromConst(const ColumnConst & src, size_t position, size_t length) +void ColumnArray::insertManyFromConst(const ColumnConst & src, size_t /*position*/, size_t length) { const ColumnArray * src_array = typeid_cast(&src.getDataColumn()); if (!src_array) diff --git a/src/Columns/ColumnMap.cpp b/src/Columns/ColumnMap.cpp index 995f3103484..57e8ba685b4 100644 --- a/src/Columns/ColumnMap.cpp +++ b/src/Columns/ColumnMap.cpp @@ -158,6 +158,11 @@ void ColumnMap::insertFrom(const IColumn & src, size_t n) nested->insertFrom(assert_cast(src).getNestedColumn(), n); } +void ColumnMap::insertManyFrom(const IColumn & src, size_t position, size_t length) +{ + assert_cast(*nested).insertManyFrom(assert_cast(src).getNestedColumn(), position, length); +} + void ColumnMap::insertRangeFrom(const IColumn & src, size_t start, size_t length) { nested->insertRangeFrom( diff --git a/src/Columns/ColumnMap.h b/src/Columns/ColumnMap.h index 17cd86a3788..60aa69e7bf6 100644 --- a/src/Columns/ColumnMap.h +++ b/src/Columns/ColumnMap.h @@ -67,6 +67,7 @@ public: void updateWeakHash32(WeakHash32 & hash) const override; void updateHashFast(SipHash & hash) const override; void insertFrom(const IColumn & src_, size_t n) override; + void insertManyFrom(const IColumn & src, size_t position, size_t length) override; void insertRangeFrom(const IColumn & src, size_t start, size_t length) override; ColumnPtr filter(const Filter & filt, ssize_t result_size_hint) const override; void expand(const Filter & mask, bool inverted) override; diff --git a/src/Columns/ColumnTuple.cpp b/src/Columns/ColumnTuple.cpp index 17cc58d92f5..062bdadf9d2 100644 --- a/src/Columns/ColumnTuple.cpp +++ b/src/Columns/ColumnTuple.cpp @@ -185,6 +185,18 @@ void ColumnTuple::insertFrom(const IColumn & src_, size_t n) columns[i]->insertFrom(*src.columns[i], n); } +void ColumnTuple::insertManyFrom(const IColumn & src, size_t position, size_t length) +{ + const ColumnTuple & src_tuple = assert_cast(src); + + const size_t tuple_size = columns.size(); + if (src_tuple.columns.size() != tuple_size) + throw Exception(ErrorCodes::CANNOT_INSERT_VALUE_OF_DIFFERENT_SIZE_INTO_TUPLE, "Cannot insert value of different size into tuple"); + + for (size_t i = 0; i < tuple_size; ++i) + columns[i]->insertManyFrom(*src_tuple.columns[i], position, length); +} + void ColumnTuple::insertDefault() { for (auto & column : columns) diff --git a/src/Columns/ColumnTuple.h b/src/Columns/ColumnTuple.h index 610416b8b11..5b626155754 100644 --- a/src/Columns/ColumnTuple.h +++ b/src/Columns/ColumnTuple.h @@ -60,6 +60,7 @@ public: void insert(const Field & x) override; bool tryInsert(const Field & x) override; void insertFrom(const IColumn & src_, size_t n) override; + void insertManyFrom(const IColumn & src, size_t position, size_t length) override; void insertDefault() override; void popBack(size_t n) override; StringRef serializeValueIntoArena(size_t n, Arena & arena, char const *& begin) const override; From 68a3ca37c40db7f9b928d9f20bde6912ba6bd7da Mon Sep 17 00:00:00 2001 From: Shaun Struwig <41984034+Blargian@users.noreply.github.com> Date: Wed, 6 Mar 2024 06:42:01 +0100 Subject: [PATCH 123/985] Add examples using columns --- .../functions/encoding-functions.md | 85 +++++++++++++++++++ 1 file changed, 85 insertions(+) diff --git a/docs/en/sql-reference/functions/encoding-functions.md b/docs/en/sql-reference/functions/encoding-functions.md index 28431c84add..c81b3e35317 100644 
--- a/docs/en/sql-reference/functions/encoding-functions.md +++ b/docs/en/sql-reference/functions/encoding-functions.md @@ -515,6 +515,8 @@ Query: SELECT mortonEncode((1,2), 1024, 16); ``` +Result: + ```response 1572864 ``` @@ -531,6 +533,8 @@ Query: SELECT mortonEncode(1); ``` +Result: + ```response 1 ``` @@ -545,10 +549,49 @@ Query: SELECT mortonEncode(tuple(2), 128); ``` +Result: + ```response 32768 ``` +**Example** + +You can also use column names in the function. + +Query: + +First create the table and insert some data. + +```sql +create table morton_numbers( + n1 UInt32, + n2 UInt32, + n3 UInt16, + n4 UInt16, + n5 UInt8, + n6 UInt8, + n7 UInt8, + n8 UInt8 +) +Engine=MergeTree() +ORDER BY n1 SETTINGS index_granularity = 8192, index_granularity_bytes = '10Mi'; +insert into morton_numbers (*) values(1,2,3,4,5,6,7,8); +``` +Use column names instead of constants as function arguments to `mortonEncode` + +Query: + +```sql +SELECT mortonEncode(n1, n2, n3, n4, n5, n6, n7, n8) FROM morton_numbers; +``` + +Result: + +```response +2155374165 +``` + **implementation details** Please note that you can fit only so many bits of information into Morton code as [UInt64](../../sql-reference/data-types/int-uint.md) has. Two arguments will have a range of maximum 2^32 (64/2) each, three arguments a range of max 2^21 (64/3) each and so on. All overflow will be clamped to zero. @@ -589,6 +632,8 @@ Query: SELECT mortonDecode(3, 53); ``` +Result: + ```response ["1","2","3"] ``` @@ -615,6 +660,8 @@ Query: SELECT mortonDecode(1, 1); ``` +Result: + ```response ["1"] ``` @@ -629,10 +676,48 @@ Query: SELECT mortonDecode(tuple(2), 32768); ``` +Result: + ```response ["128"] ``` +**Example** + +You can also use column names in the function. + +First create the table and insert some data. 
+ +Query: +```sql +create table morton_numbers( + n1 UInt32, + n2 UInt32, + n3 UInt16, + n4 UInt16, + n5 UInt8, + n6 UInt8, + n7 UInt8, + n8 UInt8 +) +Engine=MergeTree() +ORDER BY n1 SETTINGS index_granularity = 8192, index_granularity_bytes = '10Mi'; +insert into morton_numbers (*) values(1,2,3,4,5,6,7,8); +``` +Use column names instead of constants as function arguments to `mortonDecode` + +Query: + +```sql +select untuple(mortonDecode(8, mortonEncode(n1, n2, n3, n4, n5, n6, n7, n8))) from morton_numbers; +``` + +Result: + +```response +1 2 3 4 5 6 7 8 +``` + From 3005bff23100539dbb71f9623dc3aed9c34a87f6 Mon Sep 17 00:00:00 2001 From: taiyang-li <654010905@qq.com> Date: Wed, 6 Mar 2024 14:43:33 +0800 Subject: [PATCH 124/985] fix building --- src/Columns/ColumnArray.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Columns/ColumnArray.cpp b/src/Columns/ColumnArray.cpp index 5b0df8e9b6b..389b3e97820 100644 --- a/src/Columns/ColumnArray.cpp +++ b/src/Columns/ColumnArray.cpp @@ -425,7 +425,7 @@ void ColumnArray::insertManyFromTuple(const ColumnArray & src, size_t position, if (tuple_size != src_tuple_size) throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Nested tuple size mismatch: {} vs {}", tuple_size, src_tuple_size); - Columns temporary_arrays(tuple_size); + MutableColumns temporary_arrays(tuple_size); Columns src_temporary_arrays(tuple_size); for (size_t i = 0; i < tuple_size; ++i) { From 3dbb0a12fb433b29107d449099efbc99f5d71f34 Mon Sep 17 00:00:00 2001 From: unashi Date: Wed, 6 Mar 2024 16:15:37 +0800 Subject: [PATCH 125/985] [fix] style --- src/Storages/MergeTree/MergeTreeData.cpp | 7 +++---- tests/integration/helpers/cluster.py | 2 +- 2 files changed, 4 insertions(+), 5 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index d8680958c21..c76ffeee874 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -7161,11 +7161,10 @@ std::pair MergeTreeData::cloneAn try { auto reservation_space = src_part_storage->reserve(src_part->getBytesOnDisk()); - if (!reservation_space) { + if (!reservation_space) throw Exception(ErrorCodes::NOT_ENOUGH_SPACE, "Not enough space on disk."); - } - dst_part_storage - = src_part_storage->clonePart(this->getRelativeDataPath(), tmp_dst_part_name, disk, read_settings, write_settings, {}, {}); + dst_part_storage = src_part_storage->clonePart( + this->getRelativeDataPath(), tmp_dst_part_name, disk, read_settings, write_settings, {}, {}); copy_successful = true; break; } diff --git a/tests/integration/helpers/cluster.py b/tests/integration/helpers/cluster.py index 1d96563251b..767ba5b6660 100644 --- a/tests/integration/helpers/cluster.py +++ b/tests/integration/helpers/cluster.py @@ -3216,7 +3216,7 @@ services: - timeout:1 - inet6 - rotate - {networks} + {123} {app_net} {ipv4_address} {ipv6_address} From b4dba828a4dcde93944e05b512818827fd3e5a85 Mon Sep 17 00:00:00 2001 From: unashi Date: Wed, 6 Mar 2024 16:19:07 +0800 Subject: [PATCH 126/985] [fix] --- tests/integration/helpers/cluster.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/integration/helpers/cluster.py b/tests/integration/helpers/cluster.py index 767ba5b6660..1d96563251b 100644 --- a/tests/integration/helpers/cluster.py +++ b/tests/integration/helpers/cluster.py @@ -3216,7 +3216,7 @@ services: - timeout:1 - inet6 - rotate - {123} + {networks} {app_net} {ipv4_address} {ipv6_address} From 6d4514c045cc565919f9c8384710eee89354f0f3 Mon Sep 17 00:00:00 2001 
From: kssenii Date: Wed, 6 Mar 2024 16:55:48 +0800 Subject: [PATCH 127/985] Fix test --- src/Storages/System/StorageSystemDisks.cpp | 10 +++++++++- tests/integration/test_backup_restore_s3/test.py | 12 ++++++------ 2 files changed, 15 insertions(+), 7 deletions(-) diff --git a/src/Storages/System/StorageSystemDisks.cpp b/src/Storages/System/StorageSystemDisks.cpp index 30d64156b22..0f8a6640f2c 100644 --- a/src/Storages/System/StorageSystemDisks.cpp +++ b/src/Storages/System/StorageSystemDisks.cpp @@ -25,6 +25,8 @@ StorageSystemDisks::StorageSystemDisks(const StorageID & table_id_) {"unreserved_space", std::make_shared()}, {"keep_free_space", std::make_shared()}, {"type", std::make_shared()}, + {"object_storage_type", std::make_shared()}, + {"metadata_type", std::make_shared()}, {"is_encrypted", std::make_shared()}, {"is_read_only", std::make_shared()}, {"is_write_once", std::make_shared()}, @@ -53,6 +55,8 @@ Pipe StorageSystemDisks::read( MutableColumnPtr col_unreserved = ColumnUInt64::create(); MutableColumnPtr col_keep = ColumnUInt64::create(); MutableColumnPtr col_type = ColumnString::create(); + MutableColumnPtr col_object_storage_type = ColumnString::create(); + MutableColumnPtr col_metadata_type = ColumnString::create(); MutableColumnPtr col_is_encrypted = ColumnUInt8::create(); MutableColumnPtr col_is_read_only = ColumnUInt8::create(); MutableColumnPtr col_is_write_once = ColumnUInt8::create(); @@ -69,7 +73,9 @@ Pipe StorageSystemDisks::read( col_unreserved->insert(disk_ptr->getUnreservedSpace().value_or(std::numeric_limits::max())); col_keep->insert(disk_ptr->getKeepingFreeSpace()); auto data_source_description = disk_ptr->getDataSourceDescription(); - col_type->insert(data_source_description.toString()); + col_type->insert(data_source_description.type); + col_object_storage_type->insert(data_source_description.object_storage_type); + col_metadata_type->insert(data_source_description.metadata_type); col_is_encrypted->insert(data_source_description.is_encrypted); col_is_read_only->insert(disk_ptr->isReadOnly()); col_is_write_once->insert(disk_ptr->isWriteOnce()); @@ -91,6 +97,8 @@ Pipe StorageSystemDisks::read( res_columns.emplace_back(std::move(col_unreserved)); res_columns.emplace_back(std::move(col_keep)); res_columns.emplace_back(std::move(col_type)); + res_columns.emplace_back(std::move(col_object_storage_type)); + res_columns.emplace_back(std::move(col_metadata_type)); res_columns.emplace_back(std::move(col_is_encrypted)); res_columns.emplace_back(std::move(col_is_read_only)); res_columns.emplace_back(std::move(col_is_write_once)); diff --git a/tests/integration/test_backup_restore_s3/test.py b/tests/integration/test_backup_restore_s3/test.py index 4d3ee8200a3..95e264107e4 100644 --- a/tests/integration/test_backup_restore_s3/test.py +++ b/tests/integration/test_backup_restore_s3/test.py @@ -124,15 +124,15 @@ def check_backup_and_restore( def check_system_tables(backup_query_id=None): disks = [ tuple(disk.split("\t")) - for disk in node.query("SELECT name, type FROM system.disks").split("\n") + for disk in node.query("SELECT name, type, object_storage_type, metadata_type FROM system.disks").split("\n") if disk ] expected_disks = ( - ("default", "local"), - ("disk_s3", "s3"), - ("disk_s3_cache", "s3"), - ("disk_s3_other_bucket", "s3"), - ("disk_s3_plain", "s3_plain"), + ("default", "local", "", ""), + ("disk_s3", "object_storage", "s3", "local"), + ("disk_s3_cache", "object_storage", "s3", "local"), + ("disk_s3_other_bucket", "object_storage", "s3", "local"), + 
("disk_s3_plain", "object_storage", "s3", "plain"), ) assert len(expected_disks) == len(disks) for expected_disk in expected_disks: From be98c95f586762cdf20a6375917e30f296175593 Mon Sep 17 00:00:00 2001 From: robot-clickhouse Date: Wed, 6 Mar 2024 09:12:26 +0000 Subject: [PATCH 128/985] Automatic style fix --- tests/integration/test_backup_restore_s3/test.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/tests/integration/test_backup_restore_s3/test.py b/tests/integration/test_backup_restore_s3/test.py index 95e264107e4..452a9143067 100644 --- a/tests/integration/test_backup_restore_s3/test.py +++ b/tests/integration/test_backup_restore_s3/test.py @@ -124,7 +124,9 @@ def check_backup_and_restore( def check_system_tables(backup_query_id=None): disks = [ tuple(disk.split("\t")) - for disk in node.query("SELECT name, type, object_storage_type, metadata_type FROM system.disks").split("\n") + for disk in node.query( + "SELECT name, type, object_storage_type, metadata_type FROM system.disks" + ).split("\n") if disk ] expected_disks = ( From 8e413da8f156ab03c875b9525044265cffcc5b83 Mon Sep 17 00:00:00 2001 From: taiyang-li <654010905@qq.com> Date: Wed, 6 Mar 2024 17:32:08 +0800 Subject: [PATCH 129/985] apply opts for string nested in array --- src/Columns/ColumnArray.cpp | 2 ++ 1 file changed, 2 insertions(+) diff --git a/src/Columns/ColumnArray.cpp b/src/Columns/ColumnArray.cpp index 389b3e97820..44b17c89ae1 100644 --- a/src/Columns/ColumnArray.cpp +++ b/src/Columns/ColumnArray.cpp @@ -536,6 +536,8 @@ void ColumnArray::insertManyFromImpl(const ColumnArray & src, size_t position, s return insertManyFromNumber(src, position, length); if (typeid_cast *>(data.get())) return insertManyFromNumber(src, position, length); + if (typeid_cast(data.get())) + return insertManyFromString(src, position, length); if (typeid_cast(data.get())) return insertManyFromNullable(src, position, length); if (typeid_cast(data.get())) From 56fb61e1866e81e9a00b9b98299ddc56a54f5394 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?= Date: Wed, 6 Mar 2024 10:53:39 +0000 Subject: [PATCH 130/985] Do not duplicate the first category in case of multiple categories in `FunctionDocumentation` --- src/Common/FunctionDocumentation.cpp | 1 + 1 file changed, 1 insertion(+) diff --git a/src/Common/FunctionDocumentation.cpp b/src/Common/FunctionDocumentation.cpp index 2aad23b90b7..0dc5b48f9d1 100644 --- a/src/Common/FunctionDocumentation.cpp +++ b/src/Common/FunctionDocumentation.cpp @@ -36,6 +36,7 @@ std::string FunctionDocumentation::categoriesAsString() const auto it = categories.begin(); std::string res = *it; + ++it; for (; it != categories.end(); ++it) res += ", " + *it; return res; From 6f726865baf3fea606e7ff46e5d8cd98bda94f5c Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?= Date: Wed, 6 Mar 2024 11:10:02 +0000 Subject: [PATCH 131/985] Add inline docs to functions --- src/Functions/sin.cpp | 10 +++++- src/Functions/visitParamExtractBool.cpp | 30 +++++++++++++++++- src/Functions/visitParamExtractFloat.cpp | 31 ++++++++++++++++++- src/Functions/visitParamExtractInt.cpp | 31 ++++++++++++++++++- src/Functions/visitParamExtractRaw.cpp | 30 +++++++++++++++++- src/Functions/visitParamExtractString.cpp | 30 +++++++++++++++++- src/Functions/visitParamExtractUInt.cpp | 31 ++++++++++++++++++- src/Functions/visitParamHas.cpp | 23 +++++++++++++- ...new_functions_must_be_documented.reference | 8 ----- 9 files changed, 208 insertions(+), 16 deletions(-) diff --git 
a/src/Functions/sin.cpp b/src/Functions/sin.cpp index dc75f4800c0..914f431adb4 100644 --- a/src/Functions/sin.cpp +++ b/src/Functions/sin.cpp @@ -13,7 +13,15 @@ using FunctionSin = FunctionMathUnary>; REGISTER_FUNCTION(Sin) { - factory.registerFunction({}, FunctionFactory::CaseInsensitive); + factory.registerFunction( + FunctionDocumentation{ + .description = "Returns the sine of the argument.", + .syntax = "sin(x)", + .arguments = {{"x", "The number whose sine will be returned. (U)Int*, Float* or Decimal*."}}, + .returned_value = "The sine of x.", + .examples = {{.name = "simple", .query = "SELECT sin(1.23)", .result = "0.9424888019316975"}}, + .categories{"Mathematical", "Trigonometric"}}, + FunctionFactory::CaseInsensitive); } } diff --git a/src/Functions/visitParamExtractBool.cpp b/src/Functions/visitParamExtractBool.cpp index 31763fe54ce..2c413ec13bb 100644 --- a/src/Functions/visitParamExtractBool.cpp +++ b/src/Functions/visitParamExtractBool.cpp @@ -21,7 +21,35 @@ using FunctionSimpleJSONExtractBool = FunctionsStringSearch(); + factory.registerFunction(FunctionDocumentation{ + .description = "Parses a true/false value from the value of the field named field_name. The result is UInt8.", + .syntax = "simpleJSONExtractBool(json, field_name)", + .arguments + = {{"json", "The JSON in which the field is searched for. String."}, + {"field_name", "The name of the field to search for. String literal."}}, + .returned_value + = R"(It returns 1 if the value of the field is true, 0 otherwise. This means this function will return 0 including (and not only) in the following cases: + - If the field doesn't exists. + - If the field contains true as a string, e.g.: {"field":"true"}. + - If the field contains 1 as a numerical value.)", + .examples + = {{.name = "simple", + .query = R"(CREATE TABLE jsons +( + json String +) +ENGINE = Memory; + +INSERT INTO jsons VALUES ('{"foo":false,"bar":true}'); +INSERT INTO jsons VALUES ('{"foo":"true","qux":1}'); + +SELECT simpleJSONExtractBool(json, 'bar') FROM jsons ORDER BY json; +SELECT simpleJSONExtractBool(json, 'foo') FROM jsons ORDER BY json;)", + .result = R"(0 +1 +0 +0)"}}, + .categories{"JSON"}}); factory.registerAlias("visitParamExtractBool", "simpleJSONExtractBool"); } diff --git a/src/Functions/visitParamExtractFloat.cpp b/src/Functions/visitParamExtractFloat.cpp index 6f6d5274050..fc839142cc7 100644 --- a/src/Functions/visitParamExtractFloat.cpp +++ b/src/Functions/visitParamExtractFloat.cpp @@ -11,7 +11,36 @@ using FunctionSimpleJSONExtractFloat = FunctionsStringSearch(); + factory.registerFunction(FunctionDocumentation{ + .description + = "Parses Float64 from the value of the field named field_name. If this is a string field, it tries to parse a number from the " + "beginning of the string. If the field does not exist, or it exists but does not contain a number, it returns 0.", + .syntax = "simpleJSONExtractFloat(json, field_name)", + .arguments + = {{"json", "The JSON in which the field is searched for. String."}, + {"field_name", "The name of the field to search for. 
String literal."}}, + .returned_value = "It returns the number parsed from the field if the field exists and contains a number, 0 otherwise.", + .examples + = {{.name = "simple", + .query = R"(CREATE TABLE jsons +( + json String +) +ENGINE = Memory; + +INSERT INTO jsons VALUES ('{"foo":"-4e3"}'); +INSERT INTO jsons VALUES ('{"foo":-3.4}'); +INSERT INTO jsons VALUES ('{"foo":5}'); +INSERT INTO jsons VALUES ('{"foo":"not1number"}'); +INSERT INTO jsons VALUES ('{"baz":2}'); + +SELECT simpleJSONExtractFloat(json, 'foo') FROM jsons ORDER BY json;)", + .result = R"(0 +-4000 +0 +-3.4 +5)"}}, + .categories{"JSON"}}); factory.registerAlias("visitParamExtractFloat", "simpleJSONExtractFloat"); } diff --git a/src/Functions/visitParamExtractInt.cpp b/src/Functions/visitParamExtractInt.cpp index e020c43e8b4..4588fc55c52 100644 --- a/src/Functions/visitParamExtractInt.cpp +++ b/src/Functions/visitParamExtractInt.cpp @@ -11,7 +11,36 @@ using FunctionSimpleJSONExtractInt = FunctionsStringSearch(); + factory.registerFunction(FunctionDocumentation{ + .description + = "Parses Int64 from the value of the field named field_name. If this is a string field, it tries to parse a number from the " + "beginning of the string. If the field does not exist, or it exists but does not contain a number, it returns 0.", + .syntax = "simpleJSONExtractInt(json, field_name)", + .arguments + = {{"json", "The JSON in which the field is searched for. String."}, + {"field_name", "The name of the field to search for. String literal."}}, + .returned_value = "It returns the number parsed from the field if the field exists and contains a number, 0 otherwise.", + .examples + = {{.name = "simple", + .query = R"(CREATE TABLE jsons +( + json String +) +ENGINE = Memory; + +INSERT INTO jsons VALUES ('{"foo":"-4e3"}'); +INSERT INTO jsons VALUES ('{"foo":-3.4}'); +INSERT INTO jsons VALUES ('{"foo":5}'); +INSERT INTO jsons VALUES ('{"foo":"not1number"}'); +INSERT INTO jsons VALUES ('{"baz":2}'); + +SELECT simpleJSONExtractInt(json, 'foo') FROM jsons ORDER BY json;)", + .result = R"(0 +-4 +0 +-3 +5)"}}, + .categories{"JSON"}}); factory.registerAlias("visitParamExtractInt", "simpleJSONExtractInt"); } diff --git a/src/Functions/visitParamExtractRaw.cpp b/src/Functions/visitParamExtractRaw.cpp index 74a83170545..296429423fe 100644 --- a/src/Functions/visitParamExtractRaw.cpp +++ b/src/Functions/visitParamExtractRaw.cpp @@ -61,7 +61,35 @@ using FunctionSimpleJSONExtractRaw = FunctionsStringSearchToString(); + factory.registerFunction(FunctionDocumentation{ + .description = "Returns the value of the field named field_name as a String, including separators.", + .syntax = "simpleJSONExtractRaw(json, field_name)", + .arguments + = {{"json", "The JSON in which the field is searched for. String."}, + {"field_name", "The name of the field to search for. 
String literal."}}, + .returned_value + = "It returns the value of the field as a String including separators if the field exists, or an emtpy String otherwise.", + .examples + = {{.name = "simple", + .query = R"(CREATE TABLE jsons +( + json String +) +ENGINE = Memory; + +INSERT INTO jsons VALUES ('{"foo":"-4e3"}'); +INSERT INTO jsons VALUES ('{"foo":-3.4}'); +INSERT INTO jsons VALUES ('{"foo":5}'); +INSERT INTO jsons VALUES ('{"foo":{"def":[1,2,3]}}'); +INSERT INTO jsons VALUES ('{"baz":2}'); + +SELECT simpleJSONExtractRaw(json, 'foo') FROM jsons ORDER BY json;)", + .result = R"( +"-4e3" +-3.4 +5 +{"def":[1,2,3]})"}}, + .categories{"JSON"}}); factory.registerAlias("visitParamExtractRaw", "simpleJSONExtractRaw"); } diff --git a/src/Functions/visitParamExtractString.cpp b/src/Functions/visitParamExtractString.cpp index 50d5f345189..8dae10638f8 100644 --- a/src/Functions/visitParamExtractString.cpp +++ b/src/Functions/visitParamExtractString.cpp @@ -22,7 +22,35 @@ using FunctionSimpleJSONExtractString = FunctionsStringSearchToString(); + factory.registerFunction(FunctionDocumentation{ + .description = R"(Parses String in double quotes from the value of the field named field_name. + + There is currently no support for code points in the format \uXXXX\uYYYY that are not from the basic multilingual plane (they are converted to CESU-8 instead of UTF-8).)", + .syntax = "simpleJSONExtractString(json, field_name)", + .arguments + = {{"json", "The JSON in which the field is searched for. String."}, + {"field_name", "The name of the field to search for. String literal."}}, + .returned_value = "It returns the value of a field as a String, including separators. The value is unescaped. It returns an empty " + "String: if the field doesn't contain a double quoted string, if unescaping fails or if the field doesn't exist.", + .examples + = {{.name = "simple", + .query = R"(CREATE TABLE jsons +( + json String +) +ENGINE = Memory; + +INSERT INTO jsons VALUES ('{"foo":"\\n\\u0000"}'); +INSERT INTO jsons VALUES ('{"foo":"\\u263"}'); +INSERT INTO jsons VALUES ('{"foo":"\\u263a"}'); +INSERT INTO jsons VALUES ('{"foo":"hello}'); + +SELECT simpleJSONExtractString(json, 'foo') FROM jsons ORDER BY json;)", + .result = R"(\n\0 + +☺ +)"}}, + .categories{"JSON"}}); factory.registerAlias("visitParamExtractString", "simpleJSONExtractString"); } diff --git a/src/Functions/visitParamExtractUInt.cpp b/src/Functions/visitParamExtractUInt.cpp index fb58e417f34..777df9fdd24 100644 --- a/src/Functions/visitParamExtractUInt.cpp +++ b/src/Functions/visitParamExtractUInt.cpp @@ -12,7 +12,36 @@ using FunctionSimpleJSONExtractUInt = FunctionsStringSearch(); + factory.registerFunction(FunctionDocumentation{ + .description + = "Parses UInt64 from the value of the field named field_name. If this is a string field, it tries to parse a number from the " + "beginning of the string. If the field does not exist, or it exists but does not contain a number, it returns 0.", + .syntax = "simpleJSONExtractUInt(json, field_name)", + .arguments + = {{"json", "The JSON in which the field is searched for. String."}, + {"field_name", "The name of the field to search for. 
String literal."}}, + .returned_value = "It returns the number parsed from the field if the field exists and contains a number, 0 otherwise.", + .examples + = {{.name = "simple", + .query = R"(CREATE TABLE jsons +( + json String +) +ENGINE = Memory; + +INSERT INTO jsons VALUES ('{"foo":"4e3"}'); +INSERT INTO jsons VALUES ('{"foo":3.4}'); +INSERT INTO jsons VALUES ('{"foo":5}'); +INSERT INTO jsons VALUES ('{"foo":"not1number"}'); +INSERT INTO jsons VALUES ('{"baz":2}'); + +SELECT simpleJSONExtractUInt(json, 'foo') FROM jsons ORDER BY json;)", + .result = R"(0 +4 +0 +3 +5)"}}, + .categories{"JSON"}}); factory.registerAlias("visitParamExtractUInt", "simpleJSONExtractUInt"); } diff --git a/src/Functions/visitParamHas.cpp b/src/Functions/visitParamHas.cpp index 1ed1f1d16e7..09fec782980 100644 --- a/src/Functions/visitParamHas.cpp +++ b/src/Functions/visitParamHas.cpp @@ -21,7 +21,28 @@ using FunctionSimpleJSONHas = FunctionsStringSearch(); + factory.registerFunction(FunctionDocumentation{ + .description = "Checks whether there is a field named field_name. The result is UInt8.", + .syntax = "simpleJSONHas(json, field_name)", + .arguments + = {{"json", "The JSON in which the field is searched for. String."}, + {"field_name", "The name of the field to search for. String literal."}}, + .returned_value = "It returns 1 if the field exists, 0 otherwise.", + .examples + = {{.name = "simple", + .query = R"(CREATE TABLE jsons +( + json String +) +ENGINE = Memory; + +INSERT INTO jsons VALUES ('{"foo":"true","qux":1}'); + +SELECT simpleJSONHas(json, 'foo') FROM jsons; +SELECT simpleJSONHas(json, 'bar') FROM jsons;)", + .result = R"(1 +0)"}}, + .categories{"JSON"}}); factory.registerAlias("visitParamHas", "simpleJSONHas"); } diff --git a/tests/queries/0_stateless/02415_all_new_functions_must_be_documented.reference b/tests/queries/0_stateless/02415_all_new_functions_must_be_documented.reference index 379eea4dbbb..0a11e8b5034 100644 --- a/tests/queries/0_stateless/02415_all_new_functions_must_be_documented.reference +++ b/tests/queries/0_stateless/02415_all_new_functions_must_be_documented.reference @@ -643,14 +643,6 @@ shardNum showCertificate sigmoid sign -simpleJSONExtractBool -simpleJSONExtractFloat -simpleJSONExtractInt -simpleJSONExtractRaw -simpleJSONExtractString -simpleJSONExtractUInt -simpleJSONHas -sin sinh sipHash128 sipHash128Keyed From 2dc1721262c9f483917750aaa6139ff7409e02dc Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Wed, 6 Mar 2024 11:53:00 +0000 Subject: [PATCH 132/985] Refactorings for consistency --- src/Functions/array/arrayDistance.cpp | 54 +++++++-------- src/Functions/array/arrayDotProduct.cpp | 91 +++++++++++++------------ 2 files changed, 73 insertions(+), 72 deletions(-) diff --git a/src/Functions/array/arrayDistance.cpp b/src/Functions/array/arrayDistance.cpp index 71564f6fa93..6b72c99d829 100644 --- a/src/Functions/array/arrayDistance.cpp +++ b/src/Functions/array/arrayDistance.cpp @@ -379,17 +379,17 @@ public: } -#define SUPPORTED_TYPES(action) \ - action(UInt8) \ - action(UInt16) \ - action(UInt32) \ - action(UInt64) \ - action(Int8) \ - action(Int16) \ - action(Int32) \ - action(Int64) \ - action(Float32) \ - action(Float64) +#define SUPPORTED_TYPES(ACTION) \ + ACTION(UInt8) \ + ACTION(UInt16) \ + ACTION(UInt32) \ + ACTION(UInt64) \ + ACTION(Int8) \ + ACTION(Int16) \ + ACTION(Int32) \ + ACTION(Int64) \ + ACTION(Float32) \ + ACTION(Float64) private: @@ -398,12 +398,11 @@ private: { DataTypePtr type_x = typeid_cast(arguments[0].type.get())->getNestedType(); - /// Dynamic 
disaptch based on the 1st argument type switch (type_x->getTypeId()) { #define ON_TYPE(type) \ case TypeIndex::type: \ - return executeWithFirstType(arguments, input_rows_count); \ + return executeWithResultTypeAndLeftType(arguments, input_rows_count); \ break; SUPPORTED_TYPES(ON_TYPE) @@ -419,17 +418,16 @@ private: } } - template - ColumnPtr executeWithFirstType(const ColumnsWithTypeAndName & arguments, size_t input_rows_count) const + template + ColumnPtr executeWithResultTypeAndLeftType(const ColumnsWithTypeAndName & arguments, size_t input_rows_count) const { DataTypePtr type_y = typeid_cast(arguments[1].type.get())->getNestedType(); - /// Dynamic disaptch based on the 2nd argument type switch (type_y->getTypeId()) { #define ON_TYPE(type) \ case TypeIndex::type: \ - return executeWithTypes(arguments[0].column, arguments[1].column, input_rows_count, arguments); \ + return executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column, input_rows_count, arguments); \ break; SUPPORTED_TYPES(ON_TYPE) @@ -445,16 +443,16 @@ private: } } - template - ColumnPtr executeWithTypes(ColumnPtr col_x, ColumnPtr col_y, size_t input_rows_count, const ColumnsWithTypeAndName & arguments) const + template + ColumnPtr executeWithResultTypeAndLeftTypeAndRightType(ColumnPtr col_x, ColumnPtr col_y, size_t input_rows_count, const ColumnsWithTypeAndName & arguments) const { if (typeid_cast(col_x.get())) { - return executeWithTypesFirstArgConst(col_x, col_y, input_rows_count, arguments); + return executeWithLeftArgConst(col_x, col_y, input_rows_count, arguments); } else if (typeid_cast(col_y.get())) { - return executeWithTypesFirstArgConst(col_y, col_x, input_rows_count, arguments); + return executeWithLeftArgConst(col_y, col_x, input_rows_count, arguments); } col_x = col_x->convertToFullColumnIfConst(); @@ -463,8 +461,8 @@ private: const auto & array_x = *assert_cast(col_x.get()); const auto & array_y = *assert_cast(col_y.get()); - const auto & data_x = typeid_cast &>(array_x.getData()).getData(); - const auto & data_y = typeid_cast &>(array_y.getData()).getData(); + const auto & data_x = typeid_cast &>(array_x.getData()).getData(); + const auto & data_y = typeid_cast &>(array_y.getData()).getData(); const auto & offsets_x = array_x.getOffsets(); const auto & offsets_y = array_y.getOffsets(); @@ -521,8 +519,8 @@ private: } /// Special case when the 1st parameter is Const - template - ColumnPtr executeWithTypesFirstArgConst(ColumnPtr col_x, ColumnPtr col_y, size_t input_rows_count, const ColumnsWithTypeAndName & arguments) const + template + ColumnPtr executeWithLeftArgConst(ColumnPtr col_x, ColumnPtr col_y, size_t input_rows_count, const ColumnsWithTypeAndName & arguments) const { col_x = assert_cast(col_x.get())->getDataColumnPtr(); col_y = col_y->convertToFullColumnIfConst(); @@ -530,8 +528,8 @@ private: const auto & array_x = *assert_cast(col_x.get()); const auto & array_y = *assert_cast(col_y.get()); - const auto & data_x = typeid_cast &>(array_x.getData()).getData(); - const auto & data_y = typeid_cast &>(array_y.getData()).getData(); + const auto & data_x = typeid_cast &>(array_x.getData()).getData(); + const auto & data_y = typeid_cast &>(array_y.getData()).getData(); const auto & offsets_x = array_x.getOffsets(); const auto & offsets_y = array_y.getOffsets(); @@ -574,7 +572,7 @@ private: /// - the two most common metrics L2 and cosine distance, /// - the most powerful SIMD instruction set (AVX-512F). 
#if USE_MULTITARGET_CODE - if constexpr (std::is_same_v && std::is_same_v) /// ResultType is Float32 or Float64 + if constexpr (std::is_same_v && std::is_same_v) /// ResultType is Float32 or Float64 { if constexpr (std::is_same_v || std::is_same_v) diff --git a/src/Functions/array/arrayDotProduct.cpp b/src/Functions/array/arrayDotProduct.cpp index 6c615a058c3..548c79c567f 100644 --- a/src/Functions/array/arrayDotProduct.cpp +++ b/src/Functions/array/arrayDotProduct.cpp @@ -163,26 +163,29 @@ public: return Kernel::getReturnType(nested_types[0], nested_types[1]); } +#define SUPPORTED_TYPES(ACTION) \ + ACTION(UInt8) \ + ACTION(UInt16) \ + ACTION(UInt32) \ + ACTION(UInt64) \ + ACTION(Int8) \ + ACTION(Int16) \ + ACTION(Int32) \ + ACTION(Int64) \ + ACTION(Float32) \ + ACTION(Float64) + ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr & result_type, size_t /* input_rows_count */) const override { switch (result_type->getTypeId()) { - #define SUPPORTED_TYPE(type) \ + #define ON_TYPE(type) \ case TypeIndex::type: \ return executeWithResultType(arguments); \ break; - SUPPORTED_TYPE(UInt8) - SUPPORTED_TYPE(UInt16) - SUPPORTED_TYPE(UInt32) - SUPPORTED_TYPE(UInt64) - SUPPORTED_TYPE(Int8) - SUPPORTED_TYPE(Int16) - SUPPORTED_TYPE(Int32) - SUPPORTED_TYPE(Int64) - SUPPORTED_TYPE(Float32) - SUPPORTED_TYPE(Float64) - #undef SUPPORTED_TYPE + SUPPORTED_TYPES(ON_TYPE) + #undef ON_TYPE default: throw Exception(ErrorCodes::LOGICAL_ERROR, "Unexpected result type {}", result_type->getName()); @@ -194,16 +197,16 @@ private: ColumnPtr executeWithResultType(const ColumnsWithTypeAndName & arguments) const { ColumnPtr res; - if (!((res = executeWithResultTypeAndLeft(arguments)) - || (res = executeWithResultTypeAndLeft(arguments)) - || (res = executeWithResultTypeAndLeft(arguments)) - || (res = executeWithResultTypeAndLeft(arguments)) - || (res = executeWithResultTypeAndLeft(arguments)) - || (res = executeWithResultTypeAndLeft(arguments)) - || (res = executeWithResultTypeAndLeft(arguments)) - || (res = executeWithResultTypeAndLeft(arguments)) - || (res = executeWithResultTypeAndLeft(arguments)) - || (res = executeWithResultTypeAndLeft(arguments)))) + if (!((res = executeWithResultTypeAndLeftType(arguments)) + || (res = executeWithResultTypeAndLeftType(arguments)) + || (res = executeWithResultTypeAndLeftType(arguments)) + || (res = executeWithResultTypeAndLeftType(arguments)) + || (res = executeWithResultTypeAndLeftType(arguments)) + || (res = executeWithResultTypeAndLeftType(arguments)) + || (res = executeWithResultTypeAndLeftType(arguments)) + || (res = executeWithResultTypeAndLeftType(arguments)) + || (res = executeWithResultTypeAndLeftType(arguments)) + || (res = executeWithResultTypeAndLeftType(arguments)))) throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Illegal column {} of first argument of function {}", arguments[0].column->getName(), getName()); @@ -211,43 +214,43 @@ private: } template - ColumnPtr executeWithResultTypeAndLeft(const ColumnsWithTypeAndName & arguments) const + ColumnPtr executeWithResultTypeAndLeftType(const ColumnsWithTypeAndName & arguments) const { ColumnPtr res; - if ( (res = executeWithResultTypeAndLeftAndRight(arguments)) - || (res = executeWithResultTypeAndLeftAndRight(arguments)) - || (res = executeWithResultTypeAndLeftAndRight(arguments)) - || (res = executeWithResultTypeAndLeftAndRight(arguments)) - || (res = executeWithResultTypeAndLeftAndRight(arguments)) - || (res = executeWithResultTypeAndLeftAndRight(arguments)) - || (res = 
executeWithResultTypeAndLeftAndRight(arguments)) - || (res = executeWithResultTypeAndLeftAndRight(arguments)) - || (res = executeWithResultTypeAndLeftAndRight(arguments)) - || (res = executeWithResultTypeAndLeftAndRight(arguments))) + if ( (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) + || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) + || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) + || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) + || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) + || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) + || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) + || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) + || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) + || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column))) return res; return nullptr; } template - ColumnPtr executeWithResultTypeAndLeftAndRight(const ColumnsWithTypeAndName & arguments) const + ColumnPtr executeWithResultTypeAndLeftTypeAndRightType(ColumnPtr col_x, ColumnPtr col_y) const { - ColumnPtr col_left = arguments[0].column->convertToFullColumnIfConst(); - ColumnPtr col_right = arguments[1].column->convertToFullColumnIfConst(); - if (!col_left || !col_right) + col_x = col_x->convertToFullColumnIfConst(); + col_y = col_y->convertToFullColumnIfConst(); + if (!col_x || !col_y) return nullptr; - const ColumnArray * col_arr_left = checkAndGetColumn(col_left.get()); - const ColumnArray * cokl_arr_right = checkAndGetColumn(col_right.get()); - if (!col_arr_left || !cokl_arr_right) + const ColumnArray * array_x = checkAndGetColumn(col_x.get()); + const ColumnArray * array_y = checkAndGetColumn(col_y.get()); + if (!array_x || !array_y) return nullptr; - const ColumnVector * col_arr_nested_left = checkAndGetColumn>(col_arr_left->getData()); - const ColumnVector * col_arr_nested_right = checkAndGetColumn>(cokl_arr_right->getData()); + const ColumnVector * col_arr_nested_left = checkAndGetColumn>(array_x->getData()); + const ColumnVector * col_arr_nested_right = checkAndGetColumn>(array_y->getData()); if (!col_arr_nested_left || !col_arr_nested_right) return nullptr; - if (!col_arr_left->hasEqualOffsets(*cokl_arr_right)) + if (!array_x->hasEqualOffsets(*array_y)) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Array arguments for function {} must have equal sizes", getName()); auto col_res = ColumnVector::create(); @@ -255,7 +258,7 @@ private: vector( col_arr_nested_left->getData(), col_arr_nested_right->getData(), - col_arr_left->getOffsets(), + array_x->getOffsets(), col_res->getData()); return col_res; From 076482e8bd503ca352695173d87e9b48228389f0 Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Wed, 6 Mar 2024 14:04:09 +0100 Subject: [PATCH 133/985] Remove whitespaces --- src/Interpreters/OptimizeShardingKeyRewriteInVisitor.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.cpp b/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.cpp index 42c6e63da01..e0d0fda81cb 100644 --- a/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.cpp +++ 
b/src/Interpreters/OptimizeShardingKeyRewriteInVisitor.cpp @@ -132,7 +132,7 @@ class OptimizeShardingKeyRewriteIn : public InDepthQueryTreeVisitorWithContext; - + OptimizeShardingKeyRewriteIn(OptimizeShardingKeyRewriteInVisitor::Data data_, ContextPtr context) : Base(std::move(context)) , data(std::move(data_)) From 7065e650e1d007be4659ddb1f070b48e19cdef55 Mon Sep 17 00:00:00 2001 From: Dmitry Novik Date: Wed, 6 Mar 2024 14:34:03 +0100 Subject: [PATCH 134/985] Code cleanup --- src/DataTypes/ObjectUtils.cpp | 24 ++------ src/DataTypes/ObjectUtils.h | 2 - .../ClusterProxy/SelectStreamFactory.cpp | 7 +-- .../ClusterProxy/SelectStreamFactory.h | 2 +- src/Processors/QueryPlan/ReadFromRemote.cpp | 61 +++---------------- src/Storages/StorageDistributed.cpp | 1 - tests/analyzer_integration_broken_tests.txt | 1 - .../test_distributed_type_object/test.py | 3 +- 8 files changed, 18 insertions(+), 83 deletions(-) diff --git a/src/DataTypes/ObjectUtils.cpp b/src/DataTypes/ObjectUtils.cpp index 47d8c5c9113..ccfa0a28f13 100644 --- a/src/DataTypes/ObjectUtils.cpp +++ b/src/DataTypes/ObjectUtils.cpp @@ -1,4 +1,8 @@ #include +#include +#include +#include +#include #include #include #include @@ -21,16 +25,6 @@ #include #include #include -#include "Analyzer/ConstantNode.h" -#include "Analyzer/FunctionNode.h" -#include "Analyzer/IQueryTreeNode.h" -#include "Analyzer/Identifier.h" -#include "Analyzer/IdentifierNode.h" -#include "Analyzer/QueryNode.h" -#include "Analyzer/Utils.h" -#include -#include -#include "Common/logger_useful.h" namespace DB @@ -991,22 +985,12 @@ MissingObjectList replaceMissedSubcolumnsByConstants( { auto constant = std::make_shared(type->getDefault(), type); constant->setAlias(table_expression->getAlias() + "." + name); - // auto materialize = std::make_shared("materialize"); - - // auto function = FunctionFactory::instance().get("materialize", context); - // materialize->getArguments().getNodes() = { constant }; - // materialize->resolveAsFunction(function->build(materialize->getArgumentColumns())); - // materialize->setAlias(name); column_name_to_node[name] = buildCastFunction(constant, type, context); missed_list.push_back({ constant->getValueStringRepresentation() + "_" + constant->getResultType()->getName(), table_expression->getAlias() + "." 
+ name }); - LOG_DEBUG(&Poco::Logger::get("replaceMissedSubcolumnsByConstants"), "{} -> {}", missed_list.back().first, missed_list.back().second); - LOG_DEBUG(&Poco::Logger::get("replaceMissedSubcolumnsByConstants"), "Name {} Expression\n{}", name, column_name_to_node[name]->dumpTree()); } - LOG_DEBUG(&Poco::Logger::get("replaceMissedSubcolumnsByConstants"), "Table expression\n{} ", table_expression->dumpTree()); replaceColumns(query, table_expression, column_name_to_node); - LOG_DEBUG(&Poco::Logger::get("replaceMissedSubcolumnsByConstants"), "Result:\n{} ", query->dumpTree()); return missed_list; } diff --git a/src/DataTypes/ObjectUtils.h b/src/DataTypes/ObjectUtils.h index 013e525832e..6ef19baf5ae 100644 --- a/src/DataTypes/ObjectUtils.h +++ b/src/DataTypes/ObjectUtils.h @@ -3,8 +3,6 @@ #include #include #include -#include "Analyzer/IQueryTreeNode.h" -#include "Interpreters/Context_fwd.h" #include #include #include diff --git a/src/Interpreters/ClusterProxy/SelectStreamFactory.cpp b/src/Interpreters/ClusterProxy/SelectStreamFactory.cpp index 5bcd1ce68cb..4fccd83c8c0 100644 --- a/src/Interpreters/ClusterProxy/SelectStreamFactory.cpp +++ b/src/Interpreters/ClusterProxy/SelectStreamFactory.cpp @@ -5,10 +5,9 @@ #include #include #include -#include "Analyzer/IQueryTreeNode.h" -#include "Interpreters/InterpreterSelectQueryAnalyzer.h" -#include "Interpreters/SelectQueryOptions.h" -#include "Planner/Utils.h" +#include +#include +#include #include #include #include diff --git a/src/Interpreters/ClusterProxy/SelectStreamFactory.h b/src/Interpreters/ClusterProxy/SelectStreamFactory.h index bee7edb3c19..61694830b3d 100644 --- a/src/Interpreters/ClusterProxy/SelectStreamFactory.h +++ b/src/Interpreters/ClusterProxy/SelectStreamFactory.h @@ -1,6 +1,7 @@ #pragma once #include +#include #include #include #include @@ -8,7 +9,6 @@ #include #include #include -#include "Analyzer/IQueryTreeNode.h" namespace DB { diff --git a/src/Processors/QueryPlan/ReadFromRemote.cpp b/src/Processors/QueryPlan/ReadFromRemote.cpp index ac507c6d555..72848a37f6e 100644 --- a/src/Processors/QueryPlan/ReadFromRemote.cpp +++ b/src/Processors/QueryPlan/ReadFromRemote.cpp @@ -1,4 +1,3 @@ -#include #include #include @@ -15,7 +14,6 @@ #include #include #include -#include "DataTypes/ObjectUtils.h" #include #include #include @@ -33,54 +31,14 @@ namespace ErrorCodes extern const int LOGICAL_ERROR; } -static void addRenamingActions(Pipe & pipe, const MissingObjectList & missed_list, const Block & output_header) -{ - if (missed_list.empty()) - return; - - const auto & output_columns = output_header.getColumnsWithTypeAndName(); - std::vector indexes; - for (size_t i = 0; i < output_columns.size(); ++i) - { - bool found = false; - for (auto const & elem : missed_list) - { - if (output_columns[i].name.contains(elem.second)) - { - found = true; - break; - } - } - if (found) - indexes.push_back(i); - } - - auto dag = std::make_shared(pipe.getHeader().getColumnsWithTypeAndName()); - - for (size_t index : indexes) - { - dag->addOrReplaceInOutputs(dag->addAlias(*dag->getOutputs()[index], output_header.getByPosition(index).name)); - } - - // dag->addAliases(rename_to_apply); - - auto convert_actions = std::make_shared(dag); - pipe.addSimpleTransform([&](const Block & cur_header, Pipe::StreamType) -> ProcessorPtr - { - return std::make_shared(cur_header, convert_actions); - }); - - LOG_DEBUG(&Poco::Logger::get("addRenamingActions"), "EXPECTED:\n{}", output_header.dumpStructure()); - - LOG_DEBUG(&Poco::Logger::get("addRenamingActions"), "{}", 
pipe.getHeader().dumpStructure()); -} - -static void addConvertingActions(Pipe & pipe, const Block & header) +static void addConvertingActions(Pipe & pipe, const Block & header, bool use_positions_to_match = false) { if (blocksHaveEqualStructure(pipe.getHeader(), header)) return; - auto get_converting_dag = [](const Block & block_, const Block & header_) + auto match_mode = use_positions_to_match ? ActionsDAG::MatchColumnsMode::Position : ActionsDAG::MatchColumnsMode::Name; + + auto get_converting_dag = [mode = match_mode](const Block & block_, const Block & header_) { /// Convert header structure to expected. /// Also we ignore constants from result and replace it with constants from header. @@ -88,7 +46,7 @@ static void addConvertingActions(Pipe & pipe, const Block & header) return ActionsDAG::makeConvertingActions( block_.getColumnsWithTypeAndName(), header_.getColumnsWithTypeAndName(), - ActionsDAG::MatchColumnsMode::Name, + mode, true); }; @@ -260,8 +218,7 @@ void ReadFromRemote::addLazyPipe(Pipes & pipes, const ClusterProxy::SelectStream }; pipes.emplace_back(createDelayedPipe(shard.header, lazily_create_stream, add_totals, add_extremes)); - addRenamingActions(pipes.back(), shard.missing_object_list, output_stream->header); - addConvertingActions(pipes.back(), output_stream->header); + addConvertingActions(pipes.back(), output_stream->header, !shard.missing_object_list.empty()); } void ReadFromRemote::addPipe(Pipes & pipes, const ClusterProxy::SelectStreamFactory::Shard & shard) @@ -342,8 +299,7 @@ void ReadFromRemote::addPipe(Pipes & pipes, const ClusterProxy::SelectStreamFact pipes.emplace_back( createRemoteSourcePipe(remote_query_executor, add_agg_info, add_totals, add_extremes, async_read, async_query_sending)); - addRenamingActions(pipes.back(), shard.missing_object_list, output_stream->header); - addConvertingActions(pipes.back(), output_stream->header); + addConvertingActions(pipes.back(), output_stream->header, !shard.missing_object_list.empty()); } } else @@ -372,8 +328,7 @@ void ReadFromRemote::addPipe(Pipes & pipes, const ClusterProxy::SelectStreamFact pipes.emplace_back( createRemoteSourcePipe(remote_query_executor, add_agg_info, add_totals, add_extremes, async_read, async_query_sending)); - addRenamingActions(pipes.back(), shard.missing_object_list, output_stream->header); - addConvertingActions(pipes.back(), output_stream->header); + addConvertingActions(pipes.back(), output_stream->header, !shard.missing_object_list.empty()); } } diff --git a/src/Storages/StorageDistributed.cpp b/src/Storages/StorageDistributed.cpp index 34ab21a4751..726f1788115 100644 --- a/src/Storages/StorageDistributed.cpp +++ b/src/Storages/StorageDistributed.cpp @@ -30,7 +30,6 @@ #include #include #include -#include "Analyzer/IQueryTreeNode.h" #include #include diff --git a/tests/analyzer_integration_broken_tests.txt b/tests/analyzer_integration_broken_tests.txt index 796ca6bca22..a7954f91efa 100644 --- a/tests/analyzer_integration_broken_tests.txt +++ b/tests/analyzer_integration_broken_tests.txt @@ -1,6 +1,5 @@ test_build_sets_from_multiple_threads/test.py::test_set test_concurrent_backups_s3/test.py::test_concurrent_backups -test_distributed_type_object/test.py::test_distributed_type_object test_merge_table_over_distributed/test.py::test_global_in test_merge_table_over_distributed/test.py::test_select_table_name_from_merge_over_distributed test_passing_max_partitions_to_read_remotely/test.py::test_default_database_on_cluster diff --git a/tests/integration/test_distributed_type_object/test.py 
b/tests/integration/test_distributed_type_object/test.py index 7e6c000cb8e..360087c9dda 100644 --- a/tests/integration/test_distributed_type_object/test.py +++ b/tests/integration/test_distributed_type_object/test.py @@ -85,10 +85,11 @@ def test_distributed_type_object(started_cluster): 3\t\t\t\tfoo""" ) + # The following query is not supported by analyzer now assert ( TSV( node1.query( - "SELECT id, data.k1, data.k2.k3, data.k2.k4, data.k5 FROM dist_table ORDER BY id" + "SELECT id, data.k1, data.k2.k3, data.k2.k4, data.k5 FROM dist_table ORDER BY id SETTINGS allow_experimental_analyzer = 0" ) ) == expected From c3909743ed95adf5efd16e69f353aab8af73978b Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Wed, 6 Mar 2024 12:36:00 +0000 Subject: [PATCH 135/985] Remove repeated unnecessary unpacking of const columns --- src/Functions/array/arrayDotProduct.cpp | 88 +++++++++++++------------ 1 file changed, 46 insertions(+), 42 deletions(-) diff --git a/src/Functions/array/arrayDotProduct.cpp b/src/Functions/array/arrayDotProduct.cpp index 548c79c567f..c27170cd35b 100644 --- a/src/Functions/array/arrayDotProduct.cpp +++ b/src/Functions/array/arrayDotProduct.cpp @@ -19,7 +19,6 @@ namespace DB namespace ErrorCodes { extern const int BAD_ARGUMENTS; - extern const int ILLEGAL_COLUMN; extern const int ILLEGAL_TYPE_OF_ARGUMENT; extern const int LOGICAL_ERROR; } @@ -196,40 +195,51 @@ private: template ColumnPtr executeWithResultType(const ColumnsWithTypeAndName & arguments) const { - ColumnPtr res; - if (!((res = executeWithResultTypeAndLeftType(arguments)) - || (res = executeWithResultTypeAndLeftType(arguments)) - || (res = executeWithResultTypeAndLeftType(arguments)) - || (res = executeWithResultTypeAndLeftType(arguments)) - || (res = executeWithResultTypeAndLeftType(arguments)) - || (res = executeWithResultTypeAndLeftType(arguments)) - || (res = executeWithResultTypeAndLeftType(arguments)) - || (res = executeWithResultTypeAndLeftType(arguments)) - || (res = executeWithResultTypeAndLeftType(arguments)) - || (res = executeWithResultTypeAndLeftType(arguments)))) - throw Exception(ErrorCodes::ILLEGAL_COLUMN, - "Illegal column {} of first argument of function {}", arguments[0].column->getName(), getName()); + DataTypePtr type_x = typeid_cast(arguments[0].type.get())->getNestedType(); - return res; + switch (type_x->getTypeId()) + { +#define ON_TYPE(type) \ + case TypeIndex::type: \ + return executeWithResultTypeAndLeftType(arguments); \ + break; + + SUPPORTED_TYPES(ON_TYPE) +#undef ON_TYPE + + default: + throw Exception( + ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, + "Arguments of function {} has nested type {}. 
" + "Support: UInt8, UInt16, UInt32, UInt64, Int8, Int16, Int32, Int64, Float32, Float64.", + getName(), + type_x->getName()); + } } template ColumnPtr executeWithResultTypeAndLeftType(const ColumnsWithTypeAndName & arguments) const { - ColumnPtr res; - if ( (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) - || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) - || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) - || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) - || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) - || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) - || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) - || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) - || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column)) - || (res = executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column))) - return res; + DataTypePtr type_y = typeid_cast(arguments[1].type.get())->getNestedType(); - return nullptr; + switch (type_y->getTypeId()) + { + #define ON_TYPE(type) \ + case TypeIndex::type: \ + return executeWithResultTypeAndLeftTypeAndRightType(arguments[0].column, arguments[1].column); \ + break; + + SUPPORTED_TYPES(ON_TYPE) + #undef ON_TYPE + + default: + throw Exception( + ErrorCodes::ILLEGAL_TYPE_OF_ARGUMENT, + "Arguments of function {} has nested type {}. " + "Support: UInt8, UInt16, UInt32, UInt64, Int8, Int16, Int32, Int64, Float32, Float64.", + getName(), + type_y->getName()); + } } template @@ -237,28 +247,22 @@ private: { col_x = col_x->convertToFullColumnIfConst(); col_y = col_y->convertToFullColumnIfConst(); - if (!col_x || !col_y) - return nullptr; - const ColumnArray * array_x = checkAndGetColumn(col_x.get()); - const ColumnArray * array_y = checkAndGetColumn(col_y.get()); - if (!array_x || !array_y) - return nullptr; + const auto & array_x = *assert_cast(col_x.get()); + const auto & array_y = *assert_cast(col_y.get()); - const ColumnVector * col_arr_nested_left = checkAndGetColumn>(array_x->getData()); - const ColumnVector * col_arr_nested_right = checkAndGetColumn>(array_y->getData()); - if (!col_arr_nested_left || !col_arr_nested_right) - return nullptr; + const auto & data_x = typeid_cast &>(array_x.getData()).getData(); + const auto & data_y = typeid_cast &>(array_y.getData()).getData(); - if (!array_x->hasEqualOffsets(*array_y)) + if (!array_x.hasEqualOffsets(array_y)) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Array arguments for function {} must have equal sizes", getName()); auto col_res = ColumnVector::create(); vector( - col_arr_nested_left->getData(), - col_arr_nested_right->getData(), - array_x->getOffsets(), + data_x, + data_y, + array_x.getOffsets(), col_res->getData()); return col_res; From 5b94f9b4115e3b7e03118b4a4f4999139e58511e Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Wed, 6 Mar 2024 15:31:19 +0100 Subject: [PATCH 136/985] Check children first --- src/Storages/VirtualColumnUtils.cpp | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/src/Storages/VirtualColumnUtils.cpp b/src/Storages/VirtualColumnUtils.cpp index 6d66453442e..e8441b96782 
100644 --- a/src/Storages/VirtualColumnUtils.cpp +++ b/src/Storages/VirtualColumnUtils.cpp @@ -469,18 +469,18 @@ static bool canEvaluateSubtree(const ActionsDAG::Node * node, const Block & allo static bool isDeterministicInScopeOfQuery(const ActionsDAG::Node * node) { - if (node->type != ActionsDAG::ActionType::FUNCTION) - return true; - - if (!node->function_base->isDeterministicInScopeOfQuery()) - return false; - for (const auto * child : node->children) { if (!isDeterministicInScopeOfQuery(child)) return false; } + if (node->type != ActionsDAG::ActionType::FUNCTION) + return true; + + if (!node->function_base->isDeterministicInScopeOfQuery()) + return false; + return true; } From a69bcc29f5bb0bdaca1757673dac1574c97b1e2f Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Wed, 6 Mar 2024 14:53:11 +0000 Subject: [PATCH 137/985] Refactor a sanity check --- src/Functions/array/arrayDistance.cpp | 20 +++---------------- src/Functions/array/arrayDotProduct.cpp | 8 +++++--- .../queries/0_stateless/02708_dotProduct.sql | 2 +- 3 files changed, 9 insertions(+), 21 deletions(-) diff --git a/src/Functions/array/arrayDistance.cpp b/src/Functions/array/arrayDistance.cpp index 6b72c99d829..c9e6e97749f 100644 --- a/src/Functions/array/arrayDistance.cpp +++ b/src/Functions/array/arrayDistance.cpp @@ -18,11 +18,11 @@ namespace DB { namespace ErrorCodes { + extern const int ARGUMENT_OUT_OF_BOUND; extern const int ILLEGAL_COLUMN; extern const int ILLEGAL_TYPE_OF_ARGUMENT; extern const int LOGICAL_ERROR; extern const int SIZES_OF_ARRAYS_DONT_MATCH; - extern const int ARGUMENT_OUT_OF_BOUND; } struct L1Distance @@ -465,22 +465,9 @@ private: const auto & data_y = typeid_cast &>(array_y.getData()).getData(); const auto & offsets_x = array_x.getOffsets(); - const auto & offsets_y = array_y.getOffsets(); - /// Check that arrays in both columns are the sames size - for (size_t row = 0; row < offsets_x.size(); ++row) - { - if (offsets_x[row] != offsets_y[row]) [[unlikely]] - { - ColumnArray::Offset prev_offset = row > 0 ? 
offsets_x[row] : 0; - throw Exception( - ErrorCodes::SIZES_OF_ARRAYS_DONT_MATCH, - "Arguments of function {} have different array sizes: {} and {}", - getName(), - offsets_x[row] - prev_offset, - offsets_y[row] - prev_offset); - } - } + if (!array_x.hasEqualOffsets(array_y)) + throw Exception(ErrorCodes::SIZES_OF_ARRAYS_DONT_MATCH, "Array arguments for function {} must have equal sizes", getName()); const typename Kernel::ConstParams kernel_params = initConstParams(arguments); @@ -534,7 +521,6 @@ private: const auto & offsets_x = array_x.getOffsets(); const auto & offsets_y = array_y.getOffsets(); - /// Check that arrays in both columns are the sames size ColumnArray::Offset prev_offset = 0; for (size_t row : collections::range(0, offsets_y.size())) { diff --git a/src/Functions/array/arrayDotProduct.cpp b/src/Functions/array/arrayDotProduct.cpp index c27170cd35b..3abd1a6c6db 100644 --- a/src/Functions/array/arrayDotProduct.cpp +++ b/src/Functions/array/arrayDotProduct.cpp @@ -18,9 +18,9 @@ namespace DB namespace ErrorCodes { - extern const int BAD_ARGUMENTS; extern const int ILLEGAL_TYPE_OF_ARGUMENT; extern const int LOGICAL_ERROR; + extern const int SIZES_OF_ARRAYS_DONT_MATCH; } @@ -254,15 +254,17 @@ private: const auto & data_x = typeid_cast &>(array_x.getData()).getData(); const auto & data_y = typeid_cast &>(array_y.getData()).getData(); + const auto & offsets_x = array_x.getOffsets(); + if (!array_x.hasEqualOffsets(array_y)) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Array arguments for function {} must have equal sizes", getName()); + throw Exception(ErrorCodes::SIZES_OF_ARRAYS_DONT_MATCH, "Array arguments for function {} must have equal sizes", getName()); auto col_res = ColumnVector::create(); vector( data_x, data_y, - array_x.getOffsets(), + offsets_x, col_res->getData()); return col_res; diff --git a/tests/queries/0_stateless/02708_dotProduct.sql b/tests/queries/0_stateless/02708_dotProduct.sql index 6ad615664e8..2035e23cf1d 100644 --- a/tests/queries/0_stateless/02708_dotProduct.sql +++ b/tests/queries/0_stateless/02708_dotProduct.sql @@ -4,7 +4,7 @@ SELECT arrayDotProduct([1, 2]); -- { serverError NUMBER_OF_ARGUMENTS_DOESNT_MATC SELECT arrayDotProduct([1, 2], 'abc'); -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } SELECT arrayDotProduct('abc', [1, 2]); -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } SELECT arrayDotProduct([1, 2], ['abc', 'def']); -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } -SELECT arrayDotProduct([1, 2], [3, 4, 5]); -- { serverError BAD_ARGUMENTS } +SELECT arrayDotProduct([1, 2], [3, 4, 5]); -- { serverError SIZES_OF_ARRAYS_DONT_MATCH } SELECT dotProduct([1, 2], (3, 4, 5)); -- { serverError ILLEGAL_TYPE_OF_ARGUMENT } SELECT '-- Tests'; From 526f162082dfbb4ad2fb5d3d807dfd2ad9b54bdd Mon Sep 17 00:00:00 2001 From: avogar Date: Thu, 29 Feb 2024 18:20:47 +0000 Subject: [PATCH 138/985] Fix logical error on bad compatibility setting value type --- src/Core/Settings.cpp | 4 ++++ .../03003_compatibility_setting_bad_value.reference | 0 .../0_stateless/03003_compatibility_setting_bad_value.sql | 2 ++ 3 files changed, 6 insertions(+) create mode 100644 tests/queries/0_stateless/03003_compatibility_setting_bad_value.reference create mode 100644 tests/queries/0_stateless/03003_compatibility_setting_bad_value.sql diff --git a/src/Core/Settings.cpp b/src/Core/Settings.cpp index a38197b9eeb..fb456b46d89 100644 --- a/src/Core/Settings.cpp +++ b/src/Core/Settings.cpp @@ -114,7 +114,11 @@ std::vector Settings::getAllRegisteredNames() const void Settings::set(std::string_view name, 
const Field & value) { if (name == "compatibility") + { + if (value.getType() != Field::Types::Which::String) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Unexpected type of value for setting 'compatibility'. Expected String, got {}", value.getTypeName()); applyCompatibilitySetting(value.get()); + } /// If we change setting that was changed by compatibility setting before /// we should remove it from settings_changed_by_compatibility_setting, /// otherwise the next time we will change compatibility setting diff --git a/tests/queries/0_stateless/03003_compatibility_setting_bad_value.reference b/tests/queries/0_stateless/03003_compatibility_setting_bad_value.reference new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/queries/0_stateless/03003_compatibility_setting_bad_value.sql b/tests/queries/0_stateless/03003_compatibility_setting_bad_value.sql new file mode 100644 index 00000000000..9a6f4e7944a --- /dev/null +++ b/tests/queries/0_stateless/03003_compatibility_setting_bad_value.sql @@ -0,0 +1,2 @@ +select 42 settings compatibility=NULL; -- {clientError BAD_GET} + From bdb76d9dd4b42ab4f40db0d371165665171afb4d Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?= Date: Wed, 6 Mar 2024 16:30:22 +0000 Subject: [PATCH 139/985] Fix aspell errors --- docs/en/sql-reference/functions/json-functions.md | 2 +- utils/check-style/aspell-ignore/en/aspell-dict.txt | 12 +++++++++--- 2 files changed, 10 insertions(+), 4 deletions(-) diff --git a/docs/en/sql-reference/functions/json-functions.md b/docs/en/sql-reference/functions/json-functions.md index 246cb8972fb..e920ab82988 100644 --- a/docs/en/sql-reference/functions/json-functions.md +++ b/docs/en/sql-reference/functions/json-functions.md @@ -264,7 +264,7 @@ simpleJSONExtractRaw(json, field_name) **Returned value** -It returns the value of the field as a [`String`](../../sql-reference/data-types/string.md#string), including separators if the field exists, or an emtpy `String` otherwise. +It returns the value of the field as a [`String`](../../sql-reference/data-types/string.md#string), including separators if the field exists, or an empty `String` otherwise. 
**Example** diff --git a/utils/check-style/aspell-ignore/en/aspell-dict.txt b/utils/check-style/aspell-ignore/en/aspell-dict.txt index 3614bcb7452..917b2cdcc71 100644 --- a/utils/check-style/aspell-ignore/en/aspell-dict.txt +++ b/utils/check-style/aspell-ignore/en/aspell-dict.txt @@ -1,4 +1,4 @@ -personal_ws-1.1 en 2724 +personal_ws-1.1 en 2758 AArch ACLs ALTERs @@ -843,7 +843,6 @@ SendScalars ShareAlike SharedMergeTree Shortkeys -Shortkeys SimHash Simhash SimpleAggregateFunction @@ -1703,7 +1702,6 @@ hyperscan hypot hyvor iTerm -iTerm icosahedron icudata idempotency @@ -2327,6 +2325,14 @@ shortcircuit shortkeys shoutout simdjson +simpleJSON +simpleJSONExtractBool +simpleJSONExtractFloat +simpleJSONExtractInt +simpleJSONExtractRaw +simpleJSONExtractString +simpleJSONExtractUInt +simpleJSONHas simpleLinearRegression simpleaggregatefunction simplelinearregression From 77a980373a1dab7c49e5713ba7050d218c1250c7 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?= Date: Wed, 6 Mar 2024 16:31:27 +0000 Subject: [PATCH 140/985] Fix typo in inline doc --- src/Functions/visitParamExtractRaw.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Functions/visitParamExtractRaw.cpp b/src/Functions/visitParamExtractRaw.cpp index 296429423fe..3cdc5001e13 100644 --- a/src/Functions/visitParamExtractRaw.cpp +++ b/src/Functions/visitParamExtractRaw.cpp @@ -68,7 +68,7 @@ REGISTER_FUNCTION(VisitParamExtractRaw) = {{"json", "The JSON in which the field is searched for. String."}, {"field_name", "The name of the field to search for. String literal."}}, .returned_value - = "It returns the value of the field as a String including separators if the field exists, or an emtpy String otherwise.", + = "It returns the value of the field as a String including separators if the field exists, or an empty String otherwise.", .examples = {{.name = "simple", .query = R"(CREATE TABLE jsons From d9b5f9a086d8bc1af5387edee77d0e3fdbf4d9b0 Mon Sep 17 00:00:00 2001 From: Nikolay Monkov Date: Wed, 6 Mar 2024 21:37:56 +0500 Subject: [PATCH 141/985] version has been added to docker labels --- tests/ci/docker_server.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/tests/ci/docker_server.py b/tests/ci/docker_server.py index 38d0ea6d86b..803dbfcd92a 100644 --- a/tests/ci/docker_server.py +++ b/tests/ci/docker_server.py @@ -216,11 +216,12 @@ def gen_tags(version: ClickHouseVersion, release_type: str) -> List[str]: return tags -def buildx_args(urls: Dict[str, str], arch: str, direct_urls: List[str]) -> List[str]: +def buildx_args(urls: Dict[str, str], arch: str, direct_urls: List[str], version: str) -> List[str]: args = [ f"--platform=linux/{arch}", f"--label=build-url={GITHUB_RUN_URL}", f"--label=com.clickhouse.build.githash={git.sha}", + f"--label=com.clickhouse.build.version={version}", ] if direct_urls: args.append(f"--build-arg=DIRECT_DOWNLOAD_URLS='{' '.join(direct_urls)}'") @@ -267,7 +268,7 @@ def build_and_push_image( urls = [url for url in direct_urls[arch] if ".deb" in url] else: urls = [url for url in direct_urls[arch] if ".tgz" in url] - cmd_args.extend(buildx_args(repo_urls, arch, direct_urls=urls)) + cmd_args.extend(buildx_args(repo_urls, arch, direct_urls=urls, version=version.describe)) if not push: cmd_args.append(f"--tag={image.repo}:{arch_tag}") cmd_args.extend( From 245ea0c186614a5a13a7e0bed79f94bc6ad46d87 Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Wed, 6 Mar 2024 15:26:11 +0000 Subject: [PATCH 142/985] Implement const/non-const shortcut --- 
src/Functions/array/arrayDistance.cpp | 3 +- src/Functions/array/arrayDotProduct.cpp | 110 ++++++++++++++---- tests/performance/dotProduct.xml | 1 + .../0_stateless/02708_dotProduct.reference | 7 ++ .../queries/0_stateless/02708_dotProduct.sql | 9 ++ 5 files changed, 106 insertions(+), 24 deletions(-) diff --git a/src/Functions/array/arrayDistance.cpp b/src/Functions/array/arrayDistance.cpp index c9e6e97749f..03f0bc7b286 100644 --- a/src/Functions/array/arrayDistance.cpp +++ b/src/Functions/array/arrayDistance.cpp @@ -477,6 +477,7 @@ private: /// Do the actual computation ColumnArray::Offset prev = 0; size_t row = 0; + for (auto off : offsets_x) { /// Process chunks in vectorized manner @@ -522,7 +523,7 @@ private: const auto & offsets_y = array_y.getOffsets(); ColumnArray::Offset prev_offset = 0; - for (size_t row : collections::range(0, offsets_y.size())) + for (size_t row = 0; row < offsets_y.size(); ++row) { if (offsets_x[0] != offsets_y[row] - prev_offset) [[unlikely]] { diff --git a/src/Functions/array/arrayDotProduct.cpp b/src/Functions/array/arrayDotProduct.cpp index 3abd1a6c6db..f9a6687e028 100644 --- a/src/Functions/array/arrayDotProduct.cpp +++ b/src/Functions/array/arrayDotProduct.cpp @@ -245,6 +245,15 @@ private: template ColumnPtr executeWithResultTypeAndLeftTypeAndRightType(ColumnPtr col_x, ColumnPtr col_y) const { + if (typeid_cast(col_x.get())) + { + return executeWithLeftArgConst(col_x, col_y); + } + else if (typeid_cast(col_y.get())) + { + return executeWithLeftArgConst(col_y, col_x); + } + col_x = col_x->convertToFullColumnIfConst(); col_y = col_y->convertToFullColumnIfConst(); @@ -260,30 +269,83 @@ private: throw Exception(ErrorCodes::SIZES_OF_ARRAYS_DONT_MATCH, "Array arguments for function {} must have equal sizes", getName()); auto col_res = ColumnVector::create(); + auto & result = col_res->getData(); - vector( - data_x, - data_y, - offsets_x, - col_res->getData()); - - return col_res; - } - - template - static void vector( - const PaddedPODArray & left, - const PaddedPODArray & right, - const ColumnArray::Offsets & offsets, - PaddedPODArray & result) - { - size_t size = offsets.size(); + size_t size = offsets_x.size(); result.resize(size); ColumnArray::Offset current_offset = 0; for (size_t row = 0; row < size; ++row) { - size_t array_size = offsets[row] - current_offset; + size_t array_size = offsets_x[row] - current_offset; + + size_t i = 0; + + /// Process chunks in vectorized manner + static constexpr size_t VEC_SIZE = 4; + typename Kernel::template State states[VEC_SIZE]; + for (; i + VEC_SIZE < array_size; i += VEC_SIZE) + { + for (size_t j = 0; j < VEC_SIZE; ++j) + Kernel::template accumulate(states[j], static_cast(data_x[current_offset + i + j]), static_cast(data_y[current_offset + i + j])); + } + + typename Kernel::template State state; + for (const auto & other_state : states) + Kernel::template combine(state, other_state); + + /// Process the tail + for (; i < array_size; ++i) + Kernel::template accumulate(state, static_cast(data_x[current_offset + i]), static_cast(data_y[current_offset + i])); + + result[row] = Kernel::template finalize(state); + + current_offset = offsets_x[row]; + } + + return col_res; + } + + template + ColumnPtr executeWithLeftArgConst(ColumnPtr col_x, ColumnPtr col_y) const + { + col_x = assert_cast(col_x.get())->getDataColumnPtr(); + col_y = col_y->convertToFullColumnIfConst(); + + const auto & array_x = *assert_cast(col_x.get()); + const auto & array_y = *assert_cast(col_y.get()); + + const auto & data_x = typeid_cast 
&>(array_x.getData()).getData(); + const auto & data_y = typeid_cast &>(array_y.getData()).getData(); + + const auto & offsets_x = array_x.getOffsets(); + const auto & offsets_y = array_y.getOffsets(); + + ColumnArray::Offset prev_offset = 0; + for (size_t row = 0; row < offsets_y.size(); ++row) + { + if (offsets_x[0] != offsets_y[row] - prev_offset) [[unlikely]] + { + throw Exception( + ErrorCodes::SIZES_OF_ARRAYS_DONT_MATCH, + "Arguments of function {} have different array sizes: {} and {}", + getName(), + offsets_x[0], + offsets_y[row] - prev_offset); + } + prev_offset = offsets_y[row]; + } + + auto col_res = ColumnVector::create(); + auto & result = col_res->getData(); + + size_t size = offsets_y.size(); + result.resize(size); + + ColumnArray::Offset current_offset = 0; + for (size_t row = 0; row < size; ++row) + { + size_t array_size = offsets_x[0]; typename Kernel::template State state; size_t i = 0; @@ -292,13 +354,14 @@ private: /// To avoid combinatorial explosion of SIMD kernels, focus on /// - the two most common input/output types (Float32 x Float32) --> Float32 and (Float64 x Float64) --> Float64 instead of 10 x /// 10 input types x 8 output types, + /// - const/non-const inputs instead of non-const/non-const inputs /// - the most powerful SIMD instruction set (AVX-512F). #if USE_MULTITARGET_CODE if constexpr ((std::is_same_v || std::is_same_v) && std::is_same_v && std::is_same_v) { if (isArchSupported(TargetArch::AVX512F)) - Kernel::template accumulateCombine(&left[current_offset], &right[current_offset], array_size, i, state); + Kernel::template accumulateCombine(&data_x[0], &data_y[current_offset], array_size, i, state); } #else /// Process chunks in vectorized manner @@ -307,7 +370,7 @@ private: for (; i + VEC_SIZE < array_size; i += VEC_SIZE) { for (size_t j = 0; j < VEC_SIZE; ++j) - Kernel::template accumulate(states[j], static_cast(left[i + j]), static_cast(right[i + j])); + Kernel::template accumulate(states[j], static_cast(data_x[i + j]), static_cast(data_y[current_offset + i + j])); } for (const auto & other_state : states) @@ -316,13 +379,14 @@ private: /// Process the tail for (; i < array_size; ++i) - Kernel::template accumulate(state, static_cast(left[i]), static_cast(right[i])); + Kernel::template accumulate(state, static_cast(data_x[i]), static_cast(data_y[current_offset + i])); - /// ResultType res = Kernel::template finalize(state); result[row] = Kernel::template finalize(state); - current_offset = offsets[row]; + current_offset = offsets_y[row]; } + + return col_res; } }; diff --git a/tests/performance/dotProduct.xml b/tests/performance/dotProduct.xml index 6e056964ebb..a0ab7beea9c 100644 --- a/tests/performance/dotProduct.xml +++ b/tests/performance/dotProduct.xml @@ -56,6 +56,7 @@ SELECT sum(dp) FROM (SELECT dotProduct(v, v) AS dp FROM vecs_{element_type}) + WITH (SELECT v FROM vecs_{element_type} limit 1) AS a SELECT sum(dp) FROM (SELECT dotProduct(a, v) AS dp FROM vecs_{element_type}) DROP TABLE vecs_{element_type} diff --git a/tests/queries/0_stateless/02708_dotProduct.reference b/tests/queries/0_stateless/02708_dotProduct.reference index 5cc9a9f0502..593071a3521 100644 --- a/tests/queries/0_stateless/02708_dotProduct.reference +++ b/tests/queries/0_stateless/02708_dotProduct.reference @@ -32,3 +32,10 @@ 32 32 32 +-- Tests that trigger special paths +0 61 +1 186 +0 62 +1 187 +0 62 +1 187 diff --git a/tests/queries/0_stateless/02708_dotProduct.sql b/tests/queries/0_stateless/02708_dotProduct.sql index 2035e23cf1d..ac94ecc28d3 100644 --- 
a/tests/queries/0_stateless/02708_dotProduct.sql +++ b/tests/queries/0_stateless/02708_dotProduct.sql @@ -45,3 +45,12 @@ SELECT '-- Aliases'; SELECT scalarProduct([1, 2, 3], [4, 5, 6]); SELECT scalarProduct((1, 2, 3), (4, 5, 6)); SELECT arrayDotProduct([1, 2, 3], [4, 5, 6]); -- actually no alias but the internal function for arrays + +SELECT '-- Tests that trigger special paths'; +DROP TABLE IF EXISTS tab; +CREATE TABLE tab(id UInt64, vec Array(Float32)) ENGINE = MergeTree ORDER BY id; +INSERT INTO tab VALUES (0, [0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0]) (1, [5.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0]); +SELECT id, arrayDotProduct(vec, vec) FROM tab ORDER BY id; -- non-const / non-const +SELECT id, arrayDotProduct([5.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0]::Array(Float32), vec) FROM tab ORDER BY id; -- const / non-const +SELECT id, arrayDotProduct([5.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0]::Array(Float64), vec) FROM tab ORDER BY id; -- const / non-const +DROP TABLE tab; From 06a7665d0e780b52b4c1e2c1115ed41050d2d03a Mon Sep 17 00:00:00 2001 From: Shaun Struwig <41984034+Blargian@users.noreply.github.com> Date: Wed, 6 Mar 2024 18:19:52 +0100 Subject: [PATCH 143/985] Update encoding-functions.md Add missing "Result:" after query --- docs/en/sql-reference/functions/encoding-functions.md | 1 + 1 file changed, 1 insertion(+) diff --git a/docs/en/sql-reference/functions/encoding-functions.md b/docs/en/sql-reference/functions/encoding-functions.md index c81b3e35317..4f6da764b3c 100644 --- a/docs/en/sql-reference/functions/encoding-functions.md +++ b/docs/en/sql-reference/functions/encoding-functions.md @@ -469,6 +469,7 @@ Query: ```sql SELECT mortonEncode(1, 2, 3); ``` +Result: ```response 53 From 87f3c957c7dc3d16d9967723e30215e12a0b5dc0 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Ra=C3=BAl=20Mar=C3=ADn?= Date: Wed, 6 Mar 2024 21:16:22 +0100 Subject: [PATCH 144/985] Blind experiment --- base/base/itoa.h | 30 +++++++++++++++++++++++------- 1 file changed, 23 insertions(+), 7 deletions(-) diff --git a/base/base/itoa.h b/base/base/itoa.h index 513070c99d9..c450090d82f 100644 --- a/base/base/itoa.h +++ b/base/base/itoa.h @@ -349,16 +349,32 @@ namespace convert template -static inline char * writeUIntText(T x, char * p) +static inline char * writeUIntText(T _x, char * p) { - static_assert(is_unsigned_v); +#pragma clang diagnostic push +#pragma clang diagnostic ignored "-Wbit-int-extension" + int len = digits10(_x); + static_assert(std::is_same_v || std::is_same_v); + using T_ = std::conditional_t, unsigned __int128, unsigned _BitInt(256)>; +#pragma clang diagnostic pop - int len = digits10(x); - auto * pp = p + len; - while (x >= 100) + T_ x; + T_ hundred(100ULL); + if constexpr (std::is_same_v) { - const auto i = x % 100; - x /= 100; + x = (T_(_x.items[T::_impl::little(1)]) << 64) + T_(_x.items[T::_impl::little(0)]); + } + else + { + x = (T_(_x.items[T::_impl::little(3)]) << 192) + (T_(_x.items[T::_impl::little(2)]) << 128) + + (T_(_x.items[T::_impl::little(1)]) << 64) + T_(_x.items[T::_impl::little(0)]); + } + + auto * pp = p + len; + while (x >= hundred) + { + const auto i = x % hundred; + x /= hundred; pp -= 2; outTwoDigits(pp, i); } From c192d0b12532060d14934e60164df7ce771d9399 Mon Sep 17 00:00:00 2001 From: Nikita Taranov Date: Wed, 6 Mar 2024 22:29:41 +0100 Subject: [PATCH 145/985] impl 
--- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 83 +++++++++++++------ src/Storages/MergeTree/IMergeTreeDataPart.h | 8 +- .../MergeTree/MergeTreeDataPartCompact.cpp | 3 +- .../MergeTree/MergeTreeDataPartCompact.h | 12 +-- .../MergeTree/MergeTreeDataPartWide.cpp | 3 +- .../MergeTree/MergeTreeDataPartWide.h | 4 +- .../MergeTree/MergeTreeIndexGranularity.cpp | 5 +- .../MergeTree/MergeTreeIndexGranularity.h | 2 + .../MergeTreeIndexGranularityInfo.cpp | 14 +++- .../MergeTree/MergeTreeIndexGranularityInfo.h | 4 + 10 files changed, 97 insertions(+), 41 deletions(-) diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index a9bdceacef0..3922d5018c6 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -2,38 +2,41 @@ #include #include +#include #include -#include #include +#include +#include #include -#include +#include +#include +#include +#include #include +#include #include #include #include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include #include #include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include +#include #include @@ -1966,7 +1969,39 @@ void IMergeTreeDataPart::checkConsistencyBase() const } } -void IMergeTreeDataPart::checkConsistency(bool /* require_part_metadata */) const +void IMergeTreeDataPart::checkConsistency(bool require_part_metadata) const +{ + try + { + checkConsistencyBase(); + doCheckConsistency(require_part_metadata); + } + catch (Exception & e) + { + const auto part_state = fmt::format( + "state: {}, is_unexpected_local_part: {}, is_frozen: {}, is_duplicate: {}", + stateString(), + is_unexpected_local_part, + is_frozen, + is_duplicate, + is_temp); + + const auto debug_info = fmt::format( + "columns: {}, getMarkSizeInBytes: {}, getMarksCount: {}, index_granularity_info: [{}], index_granularity: [{}], " + "part_state: [{}]", + columns.toString(), + index_granularity_info.getMarkSizeInBytes(columns.size()), + index_granularity.getMarksCount(), + index_granularity_info.describe(), + index_granularity.describe(), + part_state); + + e.addMessage(debug_info); + e.rethrow(); + } +} + +void IMergeTreeDataPart::doCheckConsistency(bool /* require_part_metadata */) const { throw Exception(ErrorCodes::NOT_IMPLEMENTED, "Method 'checkConsistency' is not implemented for part with type {}", getType().toString()); } diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.h b/src/Storages/MergeTree/IMergeTreeDataPart.h index 91c559d30c8..209c2d9a256 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.h +++ b/src/Storages/MergeTree/IMergeTreeDataPart.h @@ -498,7 +498,7 @@ public: void writeChecksums(const MergeTreeDataPartChecksums & checksums_, const WriteSettings & settings); /// Checks the consistency of this data part. - virtual void checkConsistency(bool require_part_metadata) const; + void checkConsistency(bool require_part_metadata) const; /// Checks the consistency of this data part, and check the consistency of its projections (if any) as well. 
void checkConsistencyWithProjections(bool require_part_metadata) const; @@ -586,8 +586,6 @@ protected: void removeIfNeeded(); - void checkConsistencyBase() const; - /// Fill each_columns_size and total_size with sizes from columns files on /// disk using columns and checksums. virtual void calculateEachColumnSizes(ColumnSizeByName & each_columns_size, ColumnSize & total_size) const = 0; @@ -610,6 +608,8 @@ protected: void initializeIndexGranularityInfo(); + virtual void doCheckConsistency(bool require_part_metadata) const; + private: String mutable_name; mutable MergeTreeDataPartState state{MergeTreeDataPartState::Temporary}; @@ -697,6 +697,8 @@ private: void incrementStateMetric(MergeTreeDataPartState state) const; void decrementStateMetric(MergeTreeDataPartState state) const; + void checkConsistencyBase() const; + /// This ugly flag is needed for debug assertions only mutable bool part_is_probably_removed_from_disk = false; }; diff --git a/src/Storages/MergeTree/MergeTreeDataPartCompact.cpp b/src/Storages/MergeTree/MergeTreeDataPartCompact.cpp index 0ecd7abe183..5d4b602b5b8 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartCompact.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartCompact.cpp @@ -157,9 +157,8 @@ std::optional MergeTreeDataPartCompact::getColumnModificationTime(const return getDataPartStorage().getFileLastModified(DATA_FILE_NAME_WITH_EXTENSION).epochTime(); } -void MergeTreeDataPartCompact::checkConsistency(bool require_part_metadata) const +void MergeTreeDataPartCompact::doCheckConsistency(bool require_part_metadata) const { - checkConsistencyBase(); String mrk_file_name = DATA_FILE_NAME + getMarksFileExtension(); if (!checksums.empty()) diff --git a/src/Storages/MergeTree/MergeTreeDataPartCompact.h b/src/Storages/MergeTree/MergeTreeDataPartCompact.h index 35a358b3720..f897bcb0bfd 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartCompact.h +++ b/src/Storages/MergeTree/MergeTreeDataPartCompact.h @@ -67,14 +67,14 @@ protected: MergeTreeIndexGranularity & index_granularity_, const MergeTreeIndexGranularityInfo & index_granularity_info_, size_t columns_count, const IDataPartStorage & data_part_storage_); -private: - void checkConsistency(bool require_part_metadata) const override; + void doCheckConsistency(bool require_part_metadata) const override; - /// Loads marks index granularity into memory - void loadIndexGranularity() override; + private: + /// Loads marks index granularity into memory + void loadIndexGranularity() override; - /// Compact parts doesn't support per column size, only total size - void calculateEachColumnSizes(ColumnSizeByName & each_columns_size, ColumnSize & total_size) const override; + /// Compact parts doesn't support per column size, only total size + void calculateEachColumnSizes(ColumnSizeByName & each_columns_size, ColumnSize & total_size) const override; }; } diff --git a/src/Storages/MergeTree/MergeTreeDataPartWide.cpp b/src/Storages/MergeTree/MergeTreeDataPartWide.cpp index dc6c1f0019d..0111f1e7b40 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWide.cpp +++ b/src/Storages/MergeTree/MergeTreeDataPartWide.cpp @@ -182,9 +182,8 @@ MergeTreeDataPartWide::~MergeTreeDataPartWide() removeIfNeeded(); } -void MergeTreeDataPartWide::checkConsistency(bool require_part_metadata) const +void MergeTreeDataPartWide::doCheckConsistency(bool require_part_metadata) const { - checkConsistencyBase(); std::string marks_file_extension = index_granularity_info.mark_type.getFileExtension(); if (!checksums.empty()) diff --git 
a/src/Storages/MergeTree/MergeTreeDataPartWide.h b/src/Storages/MergeTree/MergeTreeDataPartWide.h index 14147c4ad56..508ea16d2d4 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartWide.h +++ b/src/Storages/MergeTree/MergeTreeDataPartWide.h @@ -62,9 +62,9 @@ protected: MergeTreeIndexGranularity & index_granularity_, MergeTreeIndexGranularityInfo & index_granularity_info_, const IDataPartStorage & data_part_storage_, const std::string & any_column_file_name); -private: - void checkConsistency(bool require_part_metadata) const override; + void doCheckConsistency(bool require_part_metadata) const override; +private: /// Loads marks index granularity into memory void loadIndexGranularity() override; diff --git a/src/Storages/MergeTree/MergeTreeIndexGranularity.cpp b/src/Storages/MergeTree/MergeTreeIndexGranularity.cpp index 5fdd0555777..2a45ab1d927 100644 --- a/src/Storages/MergeTree/MergeTreeIndexGranularity.cpp +++ b/src/Storages/MergeTree/MergeTreeIndexGranularity.cpp @@ -121,5 +121,8 @@ void MergeTreeIndexGranularity::resizeWithFixedGranularity(size_t size, size_t f } } - +std::string MergeTreeIndexGranularity::describe() const +{ + return fmt::format("initialized: {}, marks_rows_partial_sums: [{}]", initialized, fmt::join(marks_rows_partial_sums, ", ")); +} } diff --git a/src/Storages/MergeTree/MergeTreeIndexGranularity.h b/src/Storages/MergeTree/MergeTreeIndexGranularity.h index f5677995ae0..d67762f7293 100644 --- a/src/Storages/MergeTree/MergeTreeIndexGranularity.h +++ b/src/Storages/MergeTree/MergeTreeIndexGranularity.h @@ -95,6 +95,8 @@ public: /// Add `size` of marks with `fixed_granularity` rows void resizeWithFixedGranularity(size_t size, size_t fixed_granularity); + + std::string describe() const; }; } diff --git a/src/Storages/MergeTree/MergeTreeIndexGranularityInfo.cpp b/src/Storages/MergeTree/MergeTreeIndexGranularityInfo.cpp index da89d52a9ff..1ff72a4e36d 100644 --- a/src/Storages/MergeTree/MergeTreeIndexGranularityInfo.cpp +++ b/src/Storages/MergeTree/MergeTreeIndexGranularityInfo.cpp @@ -88,6 +88,10 @@ std::string MarkType::getFileExtension() const } } +std::string MarkType::describe() const +{ + return fmt::format("adaptive: {}, compressed: {}, part_type: {}", adaptive, compressed, part_type); +} std::optional MergeTreeIndexGranularityInfo::getMarksTypeFromFilesystem(const IDataPartStorage & data_part_storage) { @@ -132,10 +136,18 @@ size_t MergeTreeIndexGranularityInfo::getMarkSizeInBytes(size_t columns_num) con throw Exception(ErrorCodes::UNKNOWN_PART_TYPE, "Unknown part type"); } +std::string MergeTreeIndexGranularityInfo::describe() const +{ + return fmt::format( + "mark_type: [{}], index_granularity_bytes: {}, fixed_index_granularity: {}", + mark_type.describe(), + index_granularity_bytes, + fixed_index_granularity); +} + size_t getAdaptiveMrkSizeCompact(size_t columns_num) { /// Each mark contains number of rows in granule and two offsets for every column. 
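    /// For example, a compact part with 3 columns has marks of sizeof(UInt64) * (3 * 2 + 1) = 56 bytes each.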
return sizeof(UInt64) * (columns_num * 2 + 1); } - } diff --git a/src/Storages/MergeTree/MergeTreeIndexGranularityInfo.h b/src/Storages/MergeTree/MergeTreeIndexGranularityInfo.h index af008866919..85006c3ffde 100644 --- a/src/Storages/MergeTree/MergeTreeIndexGranularityInfo.h +++ b/src/Storages/MergeTree/MergeTreeIndexGranularityInfo.h @@ -24,6 +24,8 @@ struct MarkType static bool isMarkFileExtension(std::string_view extension); std::string getFileExtension() const; + std::string describe() const; + bool adaptive = false; bool compressed = false; MergeTreeDataPartType::Value part_type = MergeTreeDataPartType::Unknown; @@ -58,6 +60,8 @@ public: size_t getMarkSizeInBytes(size_t columns_num = 1) const; static std::optional getMarksTypeFromFilesystem(const IDataPartStorage & data_part_storage); + + std::string describe() const; }; constexpr inline auto getNonAdaptiveMrkSizeWide() { return sizeof(UInt64) * 2; } From 2b52583e06056e19df97216f41b81102bca8bd9d Mon Sep 17 00:00:00 2001 From: Nikita Taranov Date: Wed, 6 Mar 2024 23:01:42 +0100 Subject: [PATCH 146/985] fix style --- src/Storages/MergeTree/MergeTreeDataPartCompact.h | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Storages/MergeTree/MergeTreeDataPartCompact.h b/src/Storages/MergeTree/MergeTreeDataPartCompact.h index f897bcb0bfd..8bbec2808d7 100644 --- a/src/Storages/MergeTree/MergeTreeDataPartCompact.h +++ b/src/Storages/MergeTree/MergeTreeDataPartCompact.h @@ -69,7 +69,7 @@ protected: void doCheckConsistency(bool require_part_metadata) const override; - private: +private: /// Loads marks index granularity into memory void loadIndexGranularity() override; From fb17749b50ce1024ef8c0b6f7bb8b7a58321894c Mon Sep 17 00:00:00 2001 From: Nikolay Monkov Date: Thu, 7 Mar 2024 09:45:24 +0500 Subject: [PATCH 147/985] file has been reformatted to pass Style check --- tests/ci/docker_server.py | 8 ++++++-- 1 file changed, 6 insertions(+), 2 deletions(-) diff --git a/tests/ci/docker_server.py b/tests/ci/docker_server.py index 803dbfcd92a..35c86d8eadd 100644 --- a/tests/ci/docker_server.py +++ b/tests/ci/docker_server.py @@ -216,7 +216,9 @@ def gen_tags(version: ClickHouseVersion, release_type: str) -> List[str]: return tags -def buildx_args(urls: Dict[str, str], arch: str, direct_urls: List[str], version: str) -> List[str]: +def buildx_args( + urls: Dict[str, str], arch: str, direct_urls: List[str], version: str +) -> List[str]: args = [ f"--platform=linux/{arch}", f"--label=build-url={GITHUB_RUN_URL}", @@ -268,7 +270,9 @@ def build_and_push_image( urls = [url for url in direct_urls[arch] if ".deb" in url] else: urls = [url for url in direct_urls[arch] if ".tgz" in url] - cmd_args.extend(buildx_args(repo_urls, arch, direct_urls=urls, version=version.describe)) + cmd_args.extend( + buildx_args(repo_urls, arch, direct_urls=urls, version=version.describe) + ) if not push: cmd_args.append(f"--tag={image.repo}:{arch_tag}") cmd_args.extend( From f77b5963748c321975d8bd131e794dcc57002fc8 Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 7 Mar 2024 16:17:27 +0800 Subject: [PATCH 148/985] Fix test --- .../integration/test_filesystem_cache/test.py | 47 ++++++++++++------- 1 file changed, 29 insertions(+), 18 deletions(-) diff --git a/tests/integration/test_filesystem_cache/test.py b/tests/integration/test_filesystem_cache/test.py index 0cb1866f8e4..63316aba57e 100644 --- a/tests/integration/test_filesystem_cache/test.py +++ b/tests/integration/test_filesystem_cache/test.py @@ -350,6 +350,20 @@ def test_custom_cached_disk(cluster): def 
test_force_filesystem_cache_on_merges(cluster): def test(node, forced_read_through_cache_on_merge): + def to_int(value): + if value == "": + return 0 + else: + return int(value) + + r_cache_count = to_int(node.query( + "SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes'" + )) + + w_cache_count = to_int(node.query( + "SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes'" + )) + node.query( """ DROP TABLE IF EXISTS test SYNC; @@ -376,36 +390,33 @@ def test_force_filesystem_cache_on_merges(cluster): assert int(node.query("SELECT count() FROM system.filesystem_cache")) > 0 assert int(node.query("SELECT max(size) FROM system.filesystem_cache")) == 1024 - write_count = int( + w_cache_count_2 = int( node.query( "SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes'" ) ) - assert write_count > 100000 - assert "" == node.query( - "SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes'" + assert w_cache_count_2 > w_cache_count + + r_cache_count_2 = to_int( + node.query( + "SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes'" + ) ) + assert r_cache_count_2 == r_cache_count node.query("SYSTEM DROP FILESYSTEM CACHE") node.query("OPTIMIZE TABLE test FINAL") - new_write_count = int( + r_cache_count_3 = to_int( node.query( - "SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes'" - ) - ) - assert new_write_count >= write_count - - if forced_read_through_cache_on_merge: - assert 100000 < int( - node.query( - "SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes'" - ) - ) - else: - assert "" == node.query( "SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes'" ) + ) + + if forced_read_through_cache_on_merge: + assert r_cache_count_3 > r_cache_count + else: + assert r_cache_count_3 == r_cache_count node = cluster.instances["node_force_read_through_cache_on_merge"] test(node, True) From 50b84954e4810c94c1397504a64ca96e1a0fed55 Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 7 Mar 2024 16:29:38 +0800 Subject: [PATCH 149/985] Update .reference --- .../0_stateless/02117_show_create_table_system.reference | 2 ++ 1 file changed, 2 insertions(+) diff --git a/tests/queries/0_stateless/02117_show_create_table_system.reference b/tests/queries/0_stateless/02117_show_create_table_system.reference index 7382b24afbc..5081527ceef 100644 --- a/tests/queries/0_stateless/02117_show_create_table_system.reference +++ b/tests/queries/0_stateless/02117_show_create_table_system.reference @@ -195,6 +195,8 @@ CREATE TABLE system.disks `unreserved_space` UInt64, `keep_free_space` UInt64, `type` String, + `object_storage_type` String, + `metadata_type` String, `is_encrypted` UInt8, `is_read_only` UInt8, `is_write_once` UInt8, From c7f5b1631c359c61b6e4c74727092df73e956922 Mon Sep 17 00:00:00 2001 From: robot-clickhouse Date: Thu, 7 Mar 2024 08:30:34 +0000 Subject: [PATCH 150/985] Automatic style fix --- tests/integration/test_filesystem_cache/test.py | 16 ++++++++++------ 1 file changed, 10 insertions(+), 6 deletions(-) diff --git a/tests/integration/test_filesystem_cache/test.py b/tests/integration/test_filesystem_cache/test.py index 63316aba57e..c44d817c57c 100644 --- a/tests/integration/test_filesystem_cache/test.py +++ b/tests/integration/test_filesystem_cache/test.py @@ -356,13 +356,17 @@ def test_force_filesystem_cache_on_merges(cluster): else: return int(value) - r_cache_count = to_int(node.query( - "SELECT value FROM 
system.events WHERE name = 'CachedReadBufferCacheWriteBytes'" - )) + r_cache_count = to_int( + node.query( + "SELECT value FROM system.events WHERE name = 'CachedReadBufferCacheWriteBytes'" + ) + ) - w_cache_count = to_int(node.query( - "SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes'" - )) + w_cache_count = to_int( + node.query( + "SELECT value FROM system.events WHERE name = 'CachedWriteBufferCacheWriteBytes'" + ) + ) node.query( """ From 31ed1966e3c5388e601edd6e97c0497153bb7196 Mon Sep 17 00:00:00 2001 From: kssenii Date: Thu, 7 Mar 2024 16:44:10 +0800 Subject: [PATCH 151/985] Fix build --- src/Disks/ObjectStorages/ObjectStorageFactory.cpp | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/Disks/ObjectStorages/ObjectStorageFactory.cpp b/src/Disks/ObjectStorages/ObjectStorageFactory.cpp index 9d7e714445a..46136ad7b12 100644 --- a/src/Disks/ObjectStorages/ObjectStorageFactory.cpp +++ b/src/Disks/ObjectStorages/ObjectStorageFactory.cpp @@ -166,7 +166,7 @@ void registerS3ObjectStorage(ObjectStorageFactory & factory) /// NOTE: should we still perform this check for clickhouse-disks? if (!skip_access_check) - checkS3Capabilities(*object_storage, s3_capabilities, name); + checkS3Capabilities(*dynamic_cast(object_storage.get()), s3_capabilities, name); return object_storage; }); @@ -202,7 +202,7 @@ void registerS3PlainObjectStorage(ObjectStorageFactory & factory) /// NOTE: should we still perform this check for clickhouse-disks? if (!skip_access_check) - checkS3Capabilities(*object_storage, s3_capabilities, name); + checkS3Capabilities(*dynamic_cast(object_storage.get()), s3_capabilities, name); return object_storage; }); From 10b5ce8ab3d1b412f6500d03bc96e205965178d7 Mon Sep 17 00:00:00 2001 From: Smita Kulkarni Date: Thu, 7 Mar 2024 10:26:50 +0100 Subject: [PATCH 152/985] Updated BufferAllocationPolicy --- src/Backups/BackupIO_AzureBlobStorage.cpp | 4 +-- .../BufferAllocationPolicy.cpp} | 25 +++++-------- src/Common/BufferAllocationPolicy.h | 35 +++++++++++++++++++ src/Common/ThreadPoolTaskTracker.h | 2 -- src/Core/Settings.h | 5 +++ .../IO/WriteBufferFromAzureBlobStorage.cpp | 23 +++++++----- .../IO/WriteBufferFromAzureBlobStorage.h | 9 ++--- .../AzureBlobStorage/AzureBlobStorageAuth.cpp | 29 ++++++++------- .../AzureBlobStorage/AzureObjectStorage.cpp | 4 +-- .../AzureBlobStorage/AzureObjectStorage.h | 17 +++++++-- src/IO/WriteBufferFromS3.cpp | 7 +++- src/IO/WriteBufferFromS3.h | 13 +------ 12 files changed, 107 insertions(+), 66 deletions(-) rename src/{IO/WriteBufferFromS3BufferAllocationPolicy.cpp => Common/BufferAllocationPolicy.cpp} (74%) create mode 100644 src/Common/BufferAllocationPolicy.h diff --git a/src/Backups/BackupIO_AzureBlobStorage.cpp b/src/Backups/BackupIO_AzureBlobStorage.cpp index fb36248433d..8d2b217ad21 100644 --- a/src/Backups/BackupIO_AzureBlobStorage.cpp +++ b/src/Backups/BackupIO_AzureBlobStorage.cpp @@ -275,11 +275,9 @@ std::unique_ptr BackupWriterAzureBlobStorage::writeFile(const Strin return std::make_unique( client, key, - settings->max_single_part_upload_size, - settings->max_unexpected_write_error_retries, DBMS_DEFAULT_BUFFER_SIZE, write_settings, - settings->max_inflight_parts_for_one_file); + settings); } void BackupWriterAzureBlobStorage::removeFile(const String & file_name) diff --git a/src/IO/WriteBufferFromS3BufferAllocationPolicy.cpp b/src/Common/BufferAllocationPolicy.cpp similarity index 74% rename from src/IO/WriteBufferFromS3BufferAllocationPolicy.cpp rename to 
src/Common/BufferAllocationPolicy.cpp index 6347c1acfd7..1456233eb03 100644 --- a/src/IO/WriteBufferFromS3BufferAllocationPolicy.cpp +++ b/src/Common/BufferAllocationPolicy.cpp @@ -1,21 +1,17 @@ -#include "config.h" - -#if USE_AWS_S3 - -#include +#include "BufferAllocationPolicy.h" #include -namespace +namespace DB { -class FixedSizeBufferAllocationPolicy : public DB::WriteBufferFromS3::IBufferAllocationPolicy +class FixedSizeBufferAllocationPolicy : public IBufferAllocationPolicy { const size_t buffer_size = 0; size_t buffer_number = 0; public: - explicit FixedSizeBufferAllocationPolicy(const DB::S3Settings::RequestSettings::PartUploadSettings & settings_) + explicit FixedSizeBufferAllocationPolicy(const BufferAllocationSettings & settings_) : buffer_size(settings_.strict_upload_part_size) { chassert(buffer_size > 0); @@ -36,7 +32,7 @@ public: }; -class ExpBufferAllocationPolicy : public DB::WriteBufferFromS3::IBufferAllocationPolicy +class ExpBufferAllocationPolicy : public DB::IBufferAllocationPolicy { const size_t first_size = 0; const size_t second_size = 0; @@ -49,7 +45,7 @@ class ExpBufferAllocationPolicy : public DB::WriteBufferFromS3::IBufferAllocatio size_t buffer_number = 0; public: - explicit ExpBufferAllocationPolicy(const DB::S3Settings::RequestSettings::PartUploadSettings & settings_) + explicit ExpBufferAllocationPolicy(const BufferAllocationSettings & settings_) : first_size(std::max(settings_.max_single_part_upload_size, settings_.min_upload_part_size)) , second_size(settings_.min_upload_part_size) , multiply_factor(settings_.upload_part_size_multiply_factor) @@ -92,14 +88,10 @@ public: } }; -} -namespace DB -{ +IBufferAllocationPolicy::~IBufferAllocationPolicy() = default; -WriteBufferFromS3::IBufferAllocationPolicy::~IBufferAllocationPolicy() = default; - -WriteBufferFromS3::IBufferAllocationPolicyPtr WriteBufferFromS3::ChooseBufferPolicy(const S3Settings::RequestSettings::PartUploadSettings & settings_) +IBufferAllocationPolicyPtr ChooseBufferPolicy(BufferAllocationSettings settings_) { if (settings_.strict_upload_part_size > 0) return std::make_unique(settings_); @@ -109,4 +101,3 @@ WriteBufferFromS3::IBufferAllocationPolicyPtr WriteBufferFromS3::ChooseBufferPol } -#endif diff --git a/src/Common/BufferAllocationPolicy.h b/src/Common/BufferAllocationPolicy.h new file mode 100644 index 00000000000..b759d22ede6 --- /dev/null +++ b/src/Common/BufferAllocationPolicy.h @@ -0,0 +1,35 @@ +#pragma once + +#include "config.h" + +#include "logger_useful.h" + +#include + +namespace DB +{ + +struct BufferAllocationSettings +{ + size_t strict_upload_part_size = 0; + size_t min_upload_part_size = 16 * 1024 * 1024; + size_t max_upload_part_size = 5ULL * 1024 * 1024 * 1024; + size_t upload_part_size_multiply_factor = 2; + size_t upload_part_size_multiply_parts_count_threshold = 500; + size_t max_single_part_upload_size = 32 * 1024 * 1024; +}; + +class IBufferAllocationPolicy +{ + public: + virtual size_t getBufferNumber() const = 0; + virtual size_t getBufferSize() const = 0; + virtual void nextBuffer() = 0; + virtual ~IBufferAllocationPolicy() = 0; +}; + +using IBufferAllocationPolicyPtr = std::unique_ptr; + +IBufferAllocationPolicyPtr ChooseBufferPolicy(BufferAllocationSettings settings_); + +} diff --git a/src/Common/ThreadPoolTaskTracker.h b/src/Common/ThreadPoolTaskTracker.h index d37b759a913..72591648d30 100644 --- a/src/Common/ThreadPoolTaskTracker.h +++ b/src/Common/ThreadPoolTaskTracker.h @@ -11,8 +11,6 @@ namespace DB { -/// That class is used only in WriteBufferFromS3 for 
now. -/// Therefore it declared as a part of WriteBufferFromS3. /// TaskTracker takes a Callback which is run by scheduler in some external shared ThreadPool. /// TaskTracker brings the methods waitIfAny, waitAll/safeWaitAll /// to help with coordination of the running tasks. diff --git a/src/Core/Settings.h b/src/Core/Settings.h index b186ca6fe01..8ad08b7e348 100644 --- a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -78,10 +78,15 @@ class IColumn; M(UInt64, distributed_connections_pool_size, 1024, "Maximum number of connections with one remote server in the pool.", 0) \ M(UInt64, connections_with_failover_max_tries, 3, "The maximum number of attempts to connect to replicas.", 0) \ M(UInt64, s3_strict_upload_part_size, 0, "The exact size of part to upload during multipart upload to S3 (some implementations does not supports variable size parts).", 0) \ + M(UInt64, azure_strict_upload_part_size, 0, "The exact size of part to upload during multipart upload to Azure blob storage.", 0) \ M(UInt64, s3_min_upload_part_size, 16*1024*1024, "The minimum size of part to upload during multipart upload to S3.", 0) \ M(UInt64, s3_max_upload_part_size, 5ull*1024*1024*1024, "The maximum size of part to upload during multipart upload to S3.", 0) \ + M(UInt64, azure_min_upload_part_size, 16*1024*1024, "The minimum size of part to upload during multipart upload to Azure blob storage.", 0) \ + M(UInt64, azure_max_upload_part_size, 5ull*1024*1024*1024, "The maximum size of part to upload during multipart upload to Azure blob storage.", 0) \ M(UInt64, s3_upload_part_size_multiply_factor, 2, "Multiply s3_min_upload_part_size by this factor each time s3_multiply_parts_count_threshold parts were uploaded from a single write to S3.", 0) \ M(UInt64, s3_upload_part_size_multiply_parts_count_threshold, 500, "Each time this number of parts was uploaded to S3, s3_min_upload_part_size is multiplied by s3_upload_part_size_multiply_factor.", 0) \ + M(UInt64, azure_upload_part_size_multiply_factor, 2, "Multiply azure_min_upload_part_size by this factor each time azure_multiply_parts_count_threshold parts were uploaded from a single write to Azure blob storage.", 0) \ + M(UInt64, azure_upload_part_size_multiply_parts_count_threshold, 500, "Each time this number of parts was uploaded to Azure blob storage, azure_min_upload_part_size is multiplied by azure_upload_part_size_multiply_factor.", 0) \ M(UInt64, s3_max_inflight_parts_for_one_file, 20, "The maximum number of a concurrent loaded parts in multipart upload request. 0 means unlimited.", 0) \ M(UInt64, azure_max_inflight_parts_for_one_file, 20, "The maximum number of a concurrent loaded parts in multipart upload request. 
0 means unlimited.", 0) \ M(UInt64, s3_max_single_part_upload_size, 32*1024*1024, "The maximum size of object to upload using singlepart upload to S3.", 0) \ diff --git a/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp b/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp index 74a8949b235..bc11d445a51 100644 --- a/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp +++ b/src/Disks/IO/WriteBufferFromAzureBlobStorage.cpp @@ -27,23 +27,27 @@ struct WriteBufferFromAzureBlobStorage::PartData WriteBufferFromAzureBlobStorage::WriteBufferFromAzureBlobStorage( std::shared_ptr blob_container_client_, const String & blob_path_, - size_t max_single_part_upload_size_, - size_t max_unexpected_write_error_retries_, size_t buf_size_, const WriteSettings & write_settings_, - size_t max_inflight_parts_for_one_file_, + std::shared_ptr settings_, ThreadPoolCallbackRunner schedule_) : WriteBufferFromFileBase(buf_size_, nullptr, 0) , log(getLogger("WriteBufferFromAzureBlobStorage")) - , max_single_part_upload_size(max_single_part_upload_size_) - , max_unexpected_write_error_retries(max_unexpected_write_error_retries_) + , buffer_allocation_policy(ChooseBufferPolicy({settings_->strict_upload_part_size, + settings_->min_upload_part_size, + settings_->max_upload_part_size, + settings_->upload_part_size_multiply_factor, + settings_->upload_part_size_multiply_parts_count_threshold, + settings_->max_single_part_upload_size})) + , max_single_part_upload_size(settings_->max_single_part_upload_size) + , max_unexpected_write_error_retries(settings_->max_unexpected_write_error_retries) , blob_path(blob_path_) , write_settings(write_settings_) , blob_container_client(blob_container_client_) , task_tracker( std::make_unique( std::move(schedule_), - max_inflight_parts_for_one_file_, + settings_->max_inflight_parts_for_one_file, limitedLog)) { allocateBuffer(); @@ -119,7 +123,8 @@ void WriteBufferFromAzureBlobStorage::nextImpl() void WriteBufferFromAzureBlobStorage::allocateBuffer() { - memory = Memory(max_single_part_upload_size); + buffer_allocation_policy->nextBuffer(); + memory = Memory(buffer_allocation_policy->getBufferSize()); WriteBuffer::set(memory.data(), memory.size()); } @@ -129,10 +134,10 @@ void WriteBufferFromAzureBlobStorage::reallocateBuffer() if (available() > 0) return; - if (memory.size() == max_single_part_upload_size) + if (memory.size() == buffer_allocation_policy->getBufferSize()) return; - memory.resize(max_single_part_upload_size); + memory.resize(buffer_allocation_policy->getBufferSize()); WriteBuffer::set(memory.data(), memory.size()); diff --git a/src/Disks/IO/WriteBufferFromAzureBlobStorage.h b/src/Disks/IO/WriteBufferFromAzureBlobStorage.h index 4897ca9a846..7223f66693e 100644 --- a/src/Disks/IO/WriteBufferFromAzureBlobStorage.h +++ b/src/Disks/IO/WriteBufferFromAzureBlobStorage.h @@ -12,7 +12,8 @@ #include #include #include - +#include +#include namespace Poco { @@ -32,11 +33,9 @@ public: WriteBufferFromAzureBlobStorage( AzureClientPtr blob_container_client_, const String & blob_path_, - size_t max_single_part_upload_size_, - size_t max_unexpected_write_error_retries_, size_t buf_size_, const WriteSettings & write_settings_, - size_t max_inflight_parts_for_one_file_, + std::shared_ptr settings_, ThreadPoolCallbackRunner schedule_ = {}); ~WriteBufferFromAzureBlobStorage() override; @@ -63,6 +62,8 @@ private: LoggerPtr log; LogSeriesLimiterPtr limitedLog = std::make_shared(log, 1, 5); + IBufferAllocationPolicyPtr buffer_allocation_policy; + const size_t max_single_part_upload_size; const size_t 
max_unexpected_write_error_retries; const std::string blob_path; diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp index f99586b2d1a..1d01e2f45e3 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureBlobStorageAuth.cpp @@ -160,18 +160,23 @@ std::unique_ptr getAzureBlobContainerClient( std::unique_ptr getAzureBlobStorageSettings(const Poco::Util::AbstractConfiguration & config, const String & config_prefix, ContextPtr context) { - return std::make_unique( - config.getUInt64(config_prefix + ".max_single_part_upload_size", 100 * 1024 * 1024), - config.getUInt64(config_prefix + ".min_bytes_for_seek", 1024 * 1024), - config.getInt(config_prefix + ".max_single_read_retries", 3), - config.getInt(config_prefix + ".max_single_download_retries", 3), - config.getInt(config_prefix + ".list_object_keys_size", 1000), - config.getUInt64(config_prefix + ".max_upload_part_size", 5ULL * 1024 * 1024 * 1024), - config.getUInt64(config_prefix + ".max_single_part_copy_size", context->getSettings().azure_max_single_part_copy_size), - config.getBool(config_prefix + ".use_native_copy", false), - config.getUInt64(config_prefix + ".max_unexpected_write_error_retries", context->getSettings().azure_max_unexpected_write_error_retries), - config.getUInt64(config_prefix + ".max_inflight_parts_for_one_file", context->getSettings().azure_max_inflight_parts_for_one_file) - ); + std::unique_ptr settings = std::make_unique(); + settings->max_single_part_upload_size = config.getUInt64(config_prefix + ".max_single_part_upload_size", 100 * 1024 * 1024); + settings->min_bytes_for_seek = config.getUInt64(config_prefix + ".min_bytes_for_seek", 1024 * 1024); + settings->max_single_read_retries = config.getInt(config_prefix + ".max_single_read_retries", 3); + settings->max_single_download_retries = config.getInt(config_prefix + ".max_single_download_retries", 3); + settings->list_object_keys_size = config.getInt(config_prefix + ".list_object_keys_size", 1000); + settings->min_upload_part_size = config.getUInt64(config_prefix + ".min_upload_part_size", context->getSettings().azure_min_upload_part_size); + settings->max_upload_part_size = config.getUInt64(config_prefix + ".max_upload_part_size", context->getSettings().azure_max_upload_part_size); + settings->max_single_part_copy_size = config.getUInt64(config_prefix + ".max_single_part_copy_size", context->getSettings().azure_max_single_part_copy_size); + settings->use_native_copy = config.getBool(config_prefix + ".use_native_copy", false); + settings->max_unexpected_write_error_retries = config.getUInt64(config_prefix + ".max_unexpected_write_error_retries", context->getSettings().azure_max_unexpected_write_error_retries); + settings->max_inflight_parts_for_one_file = config.getUInt64(config_prefix + ".max_inflight_parts_for_one_file", context->getSettings().azure_max_inflight_parts_for_one_file); + settings->strict_upload_part_size = config.getUInt64(config_prefix + ".strict_upload_part_size", context->getSettings().azure_strict_upload_part_size); + settings->upload_part_size_multiply_factor = config.getUInt64(config_prefix + ".upload_part_size_multiply_factor", context->getSettings().azure_upload_part_size_multiply_factor); + settings->upload_part_size_multiply_parts_count_threshold = config.getUInt64(config_prefix + ".upload_part_size_multiply_parts_count_threshold", 
context->getSettings().azure_upload_part_size_multiply_parts_count_threshold); + + return settings; } } diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp index 844789ea5b5..15ab55d5611 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.cpp @@ -265,11 +265,9 @@ std::unique_ptr AzureObjectStorage::writeObject( /// NO return std::make_unique( client.get(), object.remote_path, - settings.get()->max_single_part_upload_size, - settings.get()->max_unexpected_write_error_retries, buf_size, patchSettings(write_settings), - settings.get()->max_inflight_parts_for_one_file); + settings.get()); } /// Remove file. Throws exception if file doesn't exists or it's a directory. diff --git a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h index 1b473a01304..b97d706a4d9 100644 --- a/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h +++ b/src/Disks/ObjectStorages/AzureBlobStorage/AzureObjectStorage.h @@ -24,21 +24,29 @@ struct AzureObjectStorageSettings int max_single_read_retries_, int max_single_download_retries_, int list_object_keys_size_, + size_t min_upload_part_size_, size_t max_upload_part_size_, size_t max_single_part_copy_size_, bool use_native_copy_, size_t max_unexpected_write_error_retries_, - size_t max_inflight_parts_for_one_file_) + size_t max_inflight_parts_for_one_file_, + size_t strict_upload_part_size_, + size_t upload_part_size_multiply_factor_, + size_t upload_part_size_multiply_parts_count_threshold_) : max_single_part_upload_size(max_single_part_upload_size_) , min_bytes_for_seek(min_bytes_for_seek_) , max_single_read_retries(max_single_read_retries_) , max_single_download_retries(max_single_download_retries_) , list_object_keys_size(list_object_keys_size_) + , min_upload_part_size(min_upload_part_size_) , max_upload_part_size(max_upload_part_size_) , max_single_part_copy_size(max_single_part_copy_size_) , use_native_copy(use_native_copy_) - , max_unexpected_write_error_retries (max_unexpected_write_error_retries_) - , max_inflight_parts_for_one_file (max_inflight_parts_for_one_file_) + , max_unexpected_write_error_retries(max_unexpected_write_error_retries_) + , max_inflight_parts_for_one_file(max_inflight_parts_for_one_file_) + , strict_upload_part_size(strict_upload_part_size_) + , upload_part_size_multiply_factor(upload_part_size_multiply_factor_) + , upload_part_size_multiply_parts_count_threshold(upload_part_size_multiply_parts_count_threshold_) { } @@ -55,6 +63,9 @@ struct AzureObjectStorageSettings bool use_native_copy = false; size_t max_unexpected_write_error_retries = 4; size_t max_inflight_parts_for_one_file = 20; + size_t strict_upload_part_size = 0; + size_t upload_part_size_multiply_factor = 2; + size_t upload_part_size_multiply_parts_count_threshold = 500; }; using AzureClient = Azure::Storage::Blobs::BlobContainerClient; diff --git a/src/IO/WriteBufferFromS3.cpp b/src/IO/WriteBufferFromS3.cpp index 510d9bef4d3..60fa828d6c4 100644 --- a/src/IO/WriteBufferFromS3.cpp +++ b/src/IO/WriteBufferFromS3.cpp @@ -93,7 +93,12 @@ WriteBufferFromS3::WriteBufferFromS3( , write_settings(write_settings_) , client_ptr(std::move(client_ptr_)) , object_metadata(std::move(object_metadata_)) - , buffer_allocation_policy(ChooseBufferPolicy(upload_settings)) + , 
buffer_allocation_policy(ChooseBufferPolicy({upload_settings.strict_upload_part_size, + upload_settings.min_upload_part_size, + upload_settings.max_upload_part_size, + upload_settings.upload_part_size_multiply_factor, + upload_settings.upload_part_size_multiply_parts_count_threshold, + upload_settings.max_single_part_upload_size})) , task_tracker( std::make_unique( std::move(schedule_), diff --git a/src/IO/WriteBufferFromS3.h b/src/IO/WriteBufferFromS3.h index afd8b9909c1..840274c8ace 100644 --- a/src/IO/WriteBufferFromS3.h +++ b/src/IO/WriteBufferFromS3.h @@ -13,6 +13,7 @@ #include #include #include +#include #include #include @@ -49,18 +50,6 @@ public: std::string getFileName() const override { return key; } void sync() override { next(); } - class IBufferAllocationPolicy - { - public: - virtual size_t getBufferNumber() const = 0; - virtual size_t getBufferSize() const = 0; - virtual void nextBuffer() = 0; - virtual ~IBufferAllocationPolicy() = 0; - }; - using IBufferAllocationPolicyPtr = std::unique_ptr; - - static IBufferAllocationPolicyPtr ChooseBufferPolicy(const S3Settings::RequestSettings::PartUploadSettings & settings_); - private: /// Receives response from the server after sending all data. void finalizeImpl() override; From f2a3ffe9eb79046093e77ed39f2366754e7a8ba2 Mon Sep 17 00:00:00 2001 From: Amos Bird Date: Thu, 7 Mar 2024 17:14:12 +0800 Subject: [PATCH 153/985] Replace some headers with forward decl --- src/Backups/BackupCoordinationRemote.cpp | 1 + .../NamedCollections/NamedCollectionUtils.cpp | 1 + .../ObjectStorages/ObjectStorageFactory.cpp | 3 +++ src/Formats/ReadSchemaUtils.cpp | 1 + src/Interpreters/DatabaseCatalog.cpp | 1 - src/Interpreters/DatabaseCatalog.h | 10 +++---- src/Processors/QueryPlan/AggregatingStep.cpp | 1 + src/Processors/QueryPlan/CubeStep.cpp | 1 + src/Storages/StorageAzureBlob.cpp | 4 +++ src/Storages/StorageS3.h | 27 ++++++++++--------- 10 files changed, 29 insertions(+), 21 deletions(-) diff --git a/src/Backups/BackupCoordinationRemote.cpp b/src/Backups/BackupCoordinationRemote.cpp index 9c509858b2a..b869f890f56 100644 --- a/src/Backups/BackupCoordinationRemote.cpp +++ b/src/Backups/BackupCoordinationRemote.cpp @@ -1,6 +1,7 @@ #include #include +#include #include #include diff --git a/src/Common/NamedCollections/NamedCollectionUtils.cpp b/src/Common/NamedCollections/NamedCollectionUtils.cpp index fe0f42467c7..e3ff50f5e3f 100644 --- a/src/Common/NamedCollections/NamedCollectionUtils.cpp +++ b/src/Common/NamedCollections/NamedCollectionUtils.cpp @@ -17,6 +17,7 @@ #include #include +#include namespace fs = std::filesystem; diff --git a/src/Disks/ObjectStorages/ObjectStorageFactory.cpp b/src/Disks/ObjectStorages/ObjectStorageFactory.cpp index 4f198be64fe..5fae257e8d4 100644 --- a/src/Disks/ObjectStorages/ObjectStorageFactory.cpp +++ b/src/Disks/ObjectStorages/ObjectStorageFactory.cpp @@ -21,6 +21,9 @@ #include #include +#include + +namespace fs = std::filesystem; namespace DB { diff --git a/src/Formats/ReadSchemaUtils.cpp b/src/Formats/ReadSchemaUtils.cpp index 5badf4301bf..736a35927c3 100644 --- a/src/Formats/ReadSchemaUtils.cpp +++ b/src/Formats/ReadSchemaUtils.cpp @@ -5,6 +5,7 @@ #include #include #include +#include namespace DB { diff --git a/src/Interpreters/DatabaseCatalog.cpp b/src/Interpreters/DatabaseCatalog.cpp index a9fd5c852ba..a5a523b658b 100644 --- a/src/Interpreters/DatabaseCatalog.cpp +++ b/src/Interpreters/DatabaseCatalog.cpp @@ -26,7 +26,6 @@ #include #include -#include "Interpreters/Context_fwd.h" #include "config.h" #if USE_MYSQL 
diff --git a/src/Interpreters/DatabaseCatalog.h b/src/Interpreters/DatabaseCatalog.h index 4fe114cc493..6995fc51941 100644 --- a/src/Interpreters/DatabaseCatalog.h +++ b/src/Interpreters/DatabaseCatalog.h @@ -1,15 +1,14 @@ #pragma once #include +#include +#include #include #include -#include #include #include -#include "Common/NamePrompter.h" +#include #include -#include "Storages/IStorage.h" -#include "Databases/IDatabase.h" #include #include @@ -23,9 +22,6 @@ #include #include #include -#include - -namespace fs = std::filesystem; namespace DB { diff --git a/src/Processors/QueryPlan/AggregatingStep.cpp b/src/Processors/QueryPlan/AggregatingStep.cpp index f374a7b7b10..a76bacdd97b 100644 --- a/src/Processors/QueryPlan/AggregatingStep.cpp +++ b/src/Processors/QueryPlan/AggregatingStep.cpp @@ -8,6 +8,7 @@ #include #include #include +#include #include #include #include diff --git a/src/Processors/QueryPlan/CubeStep.cpp b/src/Processors/QueryPlan/CubeStep.cpp index 0c632c346c7..bf2ce148529 100644 --- a/src/Processors/QueryPlan/CubeStep.cpp +++ b/src/Processors/QueryPlan/CubeStep.cpp @@ -5,6 +5,7 @@ #include #include #include +#include namespace DB { diff --git a/src/Storages/StorageAzureBlob.cpp b/src/Storages/StorageAzureBlob.cpp index 1f0fba99f84..2d4f1db04a1 100644 --- a/src/Storages/StorageAzureBlob.cpp +++ b/src/Storages/StorageAzureBlob.cpp @@ -41,6 +41,10 @@ #include #include +#include + +namespace fs = std::filesystem; + using namespace Azure::Storage::Blobs; namespace CurrentMetrics diff --git a/src/Storages/StorageS3.h b/src/Storages/StorageS3.h index 65fb3b51be2..bf81ead0599 100644 --- a/src/Storages/StorageS3.h +++ b/src/Storages/StorageS3.h @@ -4,27 +4,28 @@ #if USE_AWS_S3 -#include - #include - -#include -#include - -#include -#include -#include -#include -#include +#include #include +#include +#include #include #include -#include +#include +#include +#include #include +#include #include #include +#include #include -#include +#include +#include + +#include + +namespace fs = std::filesystem; namespace Aws::S3 { From f0a8d8843de5dffae2e1d4476fb119ad34059340 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Ra=C3=BAl=20Mar=C3=ADn?= Date: Thu, 7 Mar 2024 00:10:06 +0100 Subject: [PATCH 154/985] Not x86_64 are lagging behind in features --- base/base/itoa.h | 18 +++++++++++++++--- 1 file changed, 15 insertions(+), 3 deletions(-) diff --git a/base/base/itoa.h b/base/base/itoa.h index c450090d82f..a36eecaf1e5 100644 --- a/base/base/itoa.h +++ b/base/base/itoa.h @@ -351,12 +351,20 @@ namespace convert template static inline char * writeUIntText(T _x, char * p) { -#pragma clang diagnostic push -#pragma clang diagnostic ignored "-Wbit-int-extension" int len = digits10(_x); static_assert(std::is_same_v || std::is_same_v); - using T_ = std::conditional_t, unsigned __int128, unsigned _BitInt(256)>; + using T_ = std::conditional_t< + std::is_same_v, + unsigned __int128, +#if defined(__x86_64__) +#pragma clang diagnostic push +#pragma clang diagnostic ignored "-Wbit-int-extension" + unsigned _BitInt(256) #pragma clang diagnostic pop +#else + T +#endif + >; T_ x; T_ hundred(100ULL); @@ -366,8 +374,12 @@ static inline char * writeUIntText(T _x, char * p) } else { +#if defined(__x86_64__) x = (T_(_x.items[T::_impl::little(3)]) << 192) + (T_(_x.items[T::_impl::little(2)]) << 128) + (T_(_x.items[T::_impl::little(1)]) << 64) + T_(_x.items[T::_impl::little(0)]); +#else + x = _x; +#endif } auto * pp = p + len; From 66dea5111298abd4301df55b5615d158105fe78f Mon Sep 17 00:00:00 2001 From: Yarik Briukhovetskyi 
<114298166+yariks5s@users.noreply.github.com> Date: Thu, 7 Mar 2024 12:40:48 +0100 Subject: [PATCH 155/985] fix clang-tidy --- src/Functions/array/arrayDotProduct.cpp | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/src/Functions/array/arrayDotProduct.cpp b/src/Functions/array/arrayDotProduct.cpp index f9a6687e028..8b7c85e05dd 100644 --- a/src/Functions/array/arrayDotProduct.cpp +++ b/src/Functions/array/arrayDotProduct.cpp @@ -322,18 +322,18 @@ private: const auto & offsets_y = array_y.getOffsets(); ColumnArray::Offset prev_offset = 0; - for (size_t row = 0; row < offsets_y.size(); ++row) + for (auto offset_y : offsets_y) { - if (offsets_x[0] != offsets_y[row] - prev_offset) [[unlikely]] + if (offsets_x[0] != offset_y - prev_offset) [[unlikely]] { throw Exception( ErrorCodes::SIZES_OF_ARRAYS_DONT_MATCH, "Arguments of function {} have different array sizes: {} and {}", getName(), offsets_x[0], - offsets_y[row] - prev_offset); + offset_y - prev_offset); } - prev_offset = offsets_y[row]; + prev_offset = offset_y; } auto col_res = ColumnVector::create(); From 6c69e7d4dcfdfa21cfcaa103fc1cc7c53dfe0291 Mon Sep 17 00:00:00 2001 From: HowePa <2873679104@qq.com> Date: Thu, 7 Mar 2024 20:29:04 +0800 Subject: [PATCH 156/985] detect output format by file extension in clickhouse-local --- programs/local/LocalServer.cpp | 17 ++++++++++++++++- 1 file changed, 16 insertions(+), 1 deletion(-) diff --git a/programs/local/LocalServer.cpp b/programs/local/LocalServer.cpp index 68f0e52ce08..20974dd9751 100644 --- a/programs/local/LocalServer.cpp +++ b/programs/local/LocalServer.cpp @@ -327,6 +327,14 @@ static bool checkIfStdinIsRegularFile() return fstat(STDIN_FILENO, &file_stat) == 0 && S_ISREG(file_stat.st_mode); } + +static bool checkIfStdoutIsRegularFile() +{ + struct stat file_stat; + return fstat(STDOUT_FILENO, &file_stat) == 0 && S_ISREG(file_stat.st_mode); +} + + std::string LocalServer::getInitialCreateTableQuery() { if (!config().has("table-structure") && !config().has("table-file") && !config().has("table-data-format") && (!checkIfStdinIsRegularFile() || queries.empty())) @@ -638,7 +646,14 @@ void LocalServer::processConfig() if (config().has("macros")) global_context->setMacros(std::make_unique(config(), "macros", log)); - format = config().getString("output-format", config().getString("format", is_interactive ? "PrettyCompact" : "TSV")); + if (!config().has("output-format") && !config().has("format") && checkIfStdoutIsRegularFile()) + { + std::optional format_from_file_name; + format_from_file_name = FormatFactory::instance().tryGetFormatFromFileDescriptor(STDOUT_FILENO); + format = format_from_file_name ? *format_from_file_name : "TSV"; + } + else + format = config().getString("output-format", config().getString("format", is_interactive ? 
"PrettyCompact" : "TSV")); insert_format = "Values"; /// Setting value from cmd arg overrides one from config From 6d5fd2857ed50047d8acf48766165aa815ca30b9 Mon Sep 17 00:00:00 2001 From: HowePa <2873679104@qq.com> Date: Thu, 7 Mar 2024 20:29:42 +0800 Subject: [PATCH 157/985] detect output format by file extension in clickhouse-client --- programs/client/Client.cpp | 17 ++++++++++++++++- 1 file changed, 16 insertions(+), 1 deletion(-) diff --git a/programs/client/Client.cpp b/programs/client/Client.cpp index a2bd6b6016a..fac34003553 100644 --- a/programs/client/Client.cpp +++ b/programs/client/Client.cpp @@ -50,6 +50,7 @@ #include #include #include +#include namespace fs = std::filesystem; using namespace std::literals; @@ -1137,6 +1138,13 @@ void Client::processOptions(const OptionsDescription & options_description, } +static bool checkIfStdoutIsRegularFile() +{ + struct stat file_stat; + return fstat(STDOUT_FILENO, &file_stat) == 0 && S_ISREG(file_stat.st_mode); +} + + void Client::processConfig() { if (!queries.empty() && config().has("queries-file")) @@ -1173,7 +1181,14 @@ void Client::processConfig() pager = config().getString("pager", ""); is_default_format = !config().has("vertical") && !config().has("format"); - if (config().has("vertical")) + if (is_default_format && checkIfStdoutIsRegularFile()) + { + is_default_format = false; + std::optional format_from_file_name; + format_from_file_name = FormatFactory::instance().tryGetFormatFromFileDescriptor(STDOUT_FILENO); + format = format_from_file_name ? *format_from_file_name : "TabSeparated"; + } + else if (config().has("vertical")) format = config().getString("format", "Vertical"); else format = config().getString("format", is_interactive ? "PrettyCompact" : "TabSeparated"); From 112c1efb7da2619cb67a48ff7fbe65ecea8e44a9 Mon Sep 17 00:00:00 2001 From: HowePa <2873679104@qq.com> Date: Thu, 7 Mar 2024 20:30:24 +0800 Subject: [PATCH 158/985] test detect output format by file extension --- ..._output_format_by_file_extension.reference | 20 +++++++++++++++++++ ..._detect_output_format_by_file_extension.sh | 13 ++++++++++++ 2 files changed, 33 insertions(+) create mode 100644 tests/queries/0_stateless/02181_detect_output_format_by_file_extension.reference create mode 100755 tests/queries/0_stateless/02181_detect_output_format_by_file_extension.sh diff --git a/tests/queries/0_stateless/02181_detect_output_format_by_file_extension.reference b/tests/queries/0_stateless/02181_detect_output_format_by_file_extension.reference new file mode 100644 index 00000000000..7b36cc96f5e --- /dev/null +++ b/tests/queries/0_stateless/02181_detect_output_format_by_file_extension.reference @@ -0,0 +1,20 @@ +0 +1 +2 +3 +4 +5 +6 +7 +8 +9 +0 +1 +2 +3 +4 +5 +6 +7 +8 +9 diff --git a/tests/queries/0_stateless/02181_detect_output_format_by_file_extension.sh b/tests/queries/0_stateless/02181_detect_output_format_by_file_extension.sh new file mode 100755 index 00000000000..ec1edd710a1 --- /dev/null +++ b/tests/queries/0_stateless/02181_detect_output_format_by_file_extension.sh @@ -0,0 +1,13 @@ +#!/usr/bin/env bash +# Tags: no-parallel, no-fasttest + +CURDIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) +# shellcheck source=../shell_config.sh +. 
"$CURDIR"/../shell_config.sh + + +$CLICKHOUSE_LOCAL -q "select * from numbers(10)" > $CLICKHOUSE_TMP/data.parquet +$CLICKHOUSE_LOCAL -q "select * from table" < $CLICKHOUSE_TMP/data.parquet + +$CLICKHOUSE_CLIENT -q "select * from numbers(10)" > $CLICKHOUSE_TMP/data.parquet +$CLICKHOUSE_LOCAL -q "select * from table" < $CLICKHOUSE_TMP/data.parquet From 930deee699be05398aac334ce9e025d084c68a30 Mon Sep 17 00:00:00 2001 From: taiyang-li <654010905@qq.com> Date: Thu, 7 Mar 2024 22:02:10 +0800 Subject: [PATCH 159/985] fix bugs --- src/Columns/ColumnArray.cpp | 63 ++++++++++++++++++------------------- src/Columns/ColumnArray.h | 2 +- 2 files changed, 32 insertions(+), 33 deletions(-) diff --git a/src/Columns/ColumnArray.cpp b/src/Columns/ColumnArray.cpp index 44b17c89ae1..0214375122f 100644 --- a/src/Columns/ColumnArray.cpp +++ b/src/Columns/ColumnArray.cpp @@ -43,29 +43,34 @@ namespace ErrorCodes static constexpr size_t max_array_size_as_field = 1000000; -ColumnArray::ColumnArray(MutableColumnPtr && nested_column, MutableColumnPtr && offsets_column) +ColumnArray::ColumnArray(MutableColumnPtr && nested_column, MutableColumnPtr && offsets_column, bool check_offsets) : data(std::move(nested_column)), offsets(std::move(offsets_column)) { - const ColumnOffsets * offsets_concrete = typeid_cast(offsets.get()); - - if (!offsets_concrete) - throw Exception(ErrorCodes::LOGICAL_ERROR, "offsets_column must be a ColumnUInt64"); - - if (!offsets_concrete->empty() && data && !data->empty()) + if (check_offsets) { - Offset last_offset = offsets_concrete->getData().back(); + const ColumnOffsets * offsets_concrete = typeid_cast(offsets.get()); - /// This will also prevent possible overflow in offset. - if (data->size() != last_offset) - throw Exception(ErrorCodes::LOGICAL_ERROR, - "offsets_column has data inconsistent with nested_column. Data size: {}, last offset: {}", - data->size(), last_offset); + if (!offsets_concrete) + throw Exception(ErrorCodes::LOGICAL_ERROR, "offsets_column must be a ColumnUInt64"); + + if (!offsets_concrete->empty() && data && !data->empty()) + { + Offset last_offset = offsets_concrete->getData().back(); + + /// This will also prevent possible overflow in offset. + if (data->size() != last_offset) + throw Exception( + ErrorCodes::LOGICAL_ERROR, + "offsets_column has data inconsistent with nested_column. Data size: {}, last offset: {}", + data->size(), + last_offset); + } + + /** NOTE + * Arrays with constant value are possible and used in implementation of higher order functions (see FunctionReplicate). + * But in most cases, arrays with constant value are unexpected and code will work wrong. Use with caution. + */ } - - /** NOTE - * Arrays with constant value are possible and used in implementation of higher order functions (see FunctionReplicate). - * But in most cases, arrays with constant value are unexpected and code will work wrong. Use with caution. 
- */ } ColumnArray::ColumnArray(MutableColumnPtr && nested_column) @@ -425,20 +430,14 @@ void ColumnArray::insertManyFromTuple(const ColumnArray & src, size_t position, if (tuple_size != src_tuple_size) throw Exception(ErrorCodes::ILLEGAL_COLUMN, "Nested tuple size mismatch: {} vs {}", tuple_size, src_tuple_size); - MutableColumns temporary_arrays(tuple_size); - Columns src_temporary_arrays(tuple_size); - for (size_t i = 0; i < tuple_size; ++i) - { - temporary_arrays[i] = ColumnArray::create(tuple.getColumn(i).assumeMutable(), getOffsetsPtr()->assumeMutable()); - src_temporary_arrays[i] = ColumnArray::create(src_tuple.getColumn(i).assumeMutable(), src.getOffsetsPtr()->assumeMutable()); - assert_cast(*temporary_arrays[i]) - .insertManyFromImpl(assert_cast(*src_temporary_arrays[i]), position, length, false); - } - Columns tuple_columns(tuple_size); for (size_t i = 0; i < tuple_size; ++i) - tuple_columns[i] = assert_cast(*temporary_arrays[i]).getDataPtr(); - + { + auto array_of_element = ColumnArray(tuple.getColumn(i).assumeMutable(), getOffsetsPtr()->assumeMutable(), false); + auto src_array_of_element = ColumnArray(src_tuple.getColumn(i).assumeMutable(), src.getOffsetsPtr()->assumeMutable()); + array_of_element.insertManyFromImpl(src_array_of_element, position, length, false); + tuple_columns[i] = array_of_element.getDataPtr(); + } getDataPtr() = ColumnTuple::create(std::move(tuple_columns)); } @@ -448,12 +447,12 @@ void ColumnArray::insertManyFromNullable(const ColumnArray & src, size_t positio const ColumnNullable & src_nullable = assert_cast(src.getData()); /// Process nested column without updating array offsets - auto array_of_nested = ColumnArray(nullable.getNestedColumnPtr()->assumeMutable(), getOffsetsPtr()->assumeMutable()); + auto array_of_nested = ColumnArray(nullable.getNestedColumnPtr()->assumeMutable(), getOffsetsPtr()->assumeMutable(), false); auto src_array_of_nested = ColumnArray(src_nullable.getNestedColumnPtr()->assumeMutable(), src.getOffsetsPtr()->assumeMutable()); array_of_nested.insertManyFromImpl(src_array_of_nested, position, length, false); /// Process null map column without updating array offsets - auto array_of_null_map = ColumnArray(nullable.getNullMapColumnPtr()->assumeMutable(), getOffsetsPtr()->assumeMutable()); + auto array_of_null_map = ColumnArray(nullable.getNullMapColumnPtr()->assumeMutable(), getOffsetsPtr()->assumeMutable(), false); auto src_array_of_null_map = ColumnArray(src_nullable.getNullMapColumnPtr()->assumeMutable(), src.getOffsetsPtr()->assumeMutable()); array_of_null_map.insertManyFromImpl(src_array_of_null_map, position, length, false); diff --git a/src/Columns/ColumnArray.h b/src/Columns/ColumnArray.h index 765f86ec552..8c4d103e7d0 100644 --- a/src/Columns/ColumnArray.h +++ b/src/Columns/ColumnArray.h @@ -21,7 +21,7 @@ private: friend class COWHelper, ColumnArray>; /** Create an array column with specified values and offsets. 
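      * If check_offsets is false, the check that the nested column size matches the last offset is skipped;
      * insertManyFromNullable() and insertManyFromTuple() pass false for the temporary wrapper columns they build,
      * since the nested data and the shared offsets are updated separately there.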
*/ - ColumnArray(MutableColumnPtr && nested_column, MutableColumnPtr && offsets_column); + ColumnArray(MutableColumnPtr && nested_column, MutableColumnPtr && offsets_column, bool check_offsets = true); /** Create an empty column of arrays with the type of values as in the column `nested_column` */ explicit ColumnArray(MutableColumnPtr && nested_column); From cd9d9018e0db8139e48cb722e9e9685d2a212c8b Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Ra=C3=BAl=20Mar=C3=ADn?= Date: Thu, 7 Mar 2024 17:15:42 +0100 Subject: [PATCH 160/985] Be able to iterate --- base/base/CMakeLists.txt | 1 + base/base/itoa.cpp | 503 +++++++++++++++++++++++++++++++++++ base/base/itoa.h | 498 +++------------------------------- src/Functions/CMakeLists.txt | 1 + 4 files changed, 540 insertions(+), 463 deletions(-) create mode 100644 base/base/itoa.cpp diff --git a/base/base/CMakeLists.txt b/base/base/CMakeLists.txt index 548ba01d86a..55d046767b8 100644 --- a/base/base/CMakeLists.txt +++ b/base/base/CMakeLists.txt @@ -19,6 +19,7 @@ set (SRCS getPageSize.cpp getThreadId.cpp int8_to_string.cpp + itoa.cpp JSON.cpp mremap.cpp phdr_cache.cpp diff --git a/base/base/itoa.cpp b/base/base/itoa.cpp new file mode 100644 index 00000000000..9fefc9f0f07 --- /dev/null +++ b/base/base/itoa.cpp @@ -0,0 +1,503 @@ +// Based on https://github.com/amdn/itoa and combined with our optimizations +// +//=== itoa.h - Fast integer to ascii conversion --*- C++ -*-// +// +// The MIT License (MIT) +// Copyright (c) 2016 Arturo Martin-de-Nicolas +// +// Permission is hereby granted, free of charge, to any person obtaining a copy +// of this software and associated documentation files (the "Software"), to deal +// in the Software without restriction, including without limitation the rights +// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +// copies of the Software, and to permit persons to whom the Software is +// furnished to do so, subject to the following conditions: +// +// The above copyright notice and this permission notice shall be included +// in all copies or substantial portions of the Software. +// +// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +// SOFTWARE. +//===----------------------------------------------------------------------===// + +#include +#include +#include +#include +#include +#include +#include + + +template +int digits10(T x) +{ + if (x < T(10ULL)) + return 1; + if (x < T(100ULL)) + return 2; + if constexpr (sizeof(T) == 1) + return 3; + else + { + if (x < T(1000ULL)) + return 3; + + if (x < T(1000000000000ULL)) + { + if (x < T(100000000ULL)) + { + if (x < T(1000000ULL)) + { + if (x < T(10000ULL)) + return 4; + else + return 5 + (x >= T(100000ULL)); + } + + return 7 + (x >= T(10000000ULL)); + } + + if (x < T(10000000000ULL)) + return 9 + (x >= T(1000000000ULL)); + + return 11 + (x >= T(100000000000ULL)); + } + + return 12 + digits10(x / T(1000000000000ULL)); + } +} + + +namespace +{ + +template +static constexpr T pow10(size_t x) +{ + return x ? 10 * pow10(x - 1) : 1; +} + +// Division by a power of 10 is implemented using a multiplicative inverse. 
+// This strength reduction is also done by optimizing compilers, but +// presently the fastest results are produced by using the values +// for the multiplication and the shift as given by the algorithm +// described by Agner Fog in "Optimizing Subroutines in Assembly Language" +// +// http://www.agner.org/optimize/optimizing_assembly.pdf +// +// "Integer division by a constant (all processors) +// A floating point number can be divided by a constant by multiplying +// with the reciprocal. If we want to do the same with integers, we have +// to scale the reciprocal by 2n and then shift the product to the right +// by n. There are various algorithms for finding a suitable value of n +// and compensating for rounding errors. The algorithm described below +// was invented by Terje Mathisen, Norway, and not published elsewhere." + +/// Division by constant is performed by: +/// 1. Adding 1 if needed; +/// 2. Multiplying by another constant; +/// 3. Shifting right by another constant. +template +struct Division +{ + static constexpr bool add{add_}; + static constexpr UInt multiplier{multiplier_}; + static constexpr unsigned shift{shift_}; +}; + +/// Select a type with appropriate number of bytes from the list of types. +/// First parameter is the number of bytes requested. Then goes a list of types with 1, 2, 4, ... number of bytes. +/// Example: SelectType<4, uint8_t, uint16_t, uint32_t, uint64_t> will select uint32_t. +template +struct SelectType +{ + using Result = typename SelectType::Result; +}; + +template +struct SelectType<1, T, Ts...> +{ + using Result = T; +}; + + +/// Division by 10^N where N is the size of the type. +template +using DivisionBy10PowN = typename SelectType< + N, + Division, /// divide by 10 + Division, /// divide by 100 + Division, /// divide by 10000 + Division /// divide by 100000000 + >::Result; + +template +using UnsignedOfSize = typename SelectType::Result; + +/// Holds the result of dividing an unsigned N-byte variable by 10^N resulting in +template +struct QuotientAndRemainder +{ + UnsignedOfSize quotient; // quotient with fewer than 2*N decimal digits + UnsignedOfSize remainder; // remainder with at most N decimal digits +}; + +template +QuotientAndRemainder static inline split(UnsignedOfSize value) +{ + constexpr DivisionBy10PowN division; + + UnsignedOfSize quotient = (division.multiplier * (UnsignedOfSize<2 * N>(value) + division.add)) >> division.shift; + UnsignedOfSize remainder = static_cast>(value - quotient * pow10>(N)); + + return {quotient, remainder}; +} + + +static inline char * outDigit(char * p, uint8_t value) +{ + *p = '0' + value; + ++p; + return p; +} + +// Using a lookup table to convert binary numbers from 0 to 99 +// into ascii characters as described by Andrei Alexandrescu in +// https://www.facebook.com/notes/facebook-engineering/three-optimization-tips-for-c/10151361643253920/ + +static const char digits[201] = "00010203040506070809" + "10111213141516171819" + "20212223242526272829" + "30313233343536373839" + "40414243444546474849" + "50515253545556575859" + "60616263646566676869" + "70717273747576777879" + "80818283848586878889" + "90919293949596979899"; + +static inline char * outTwoDigits(char * p, uint8_t value) +{ + memcpy(p, &digits[value * 2], 2); + p += 2; + return p; +} + + +namespace convert +{ +template +static char * head(char * p, UInt u); +template +static char * tail(char * p, UInt u); + +//===----------------------------------------------------------===// +// head: find most significant digit, skip leading zeros 
+//===----------------------------------------------------------===// + +// "x" contains quotient and remainder after division by 10^N +// quotient is less than 10^N +template +static inline char * head(char * p, QuotientAndRemainder x) +{ + p = head(p, UnsignedOfSize(x.quotient)); + p = tail(p, x.remainder); + return p; +} + +// "u" is less than 10^2*N +template +static inline char * head(char * p, UInt u) +{ + return u < pow10>(N) ? head(p, UnsignedOfSize(u)) : head(p, split(u)); +} + +// recursion base case, selected when "u" is one byte +template <> +inline char * head, 1>(char * p, UnsignedOfSize<1> u) +{ + return u < 10 ? outDigit(p, u) : outTwoDigits(p, u); +} + +//===----------------------------------------------------------===// +// tail: produce all digits including leading zeros +//===----------------------------------------------------------===// + +// recursive step, "u" is less than 10^2*N +template +static inline char * tail(char * p, UInt u) +{ + QuotientAndRemainder x = split(u); + p = tail(p, UnsignedOfSize(x.quotient)); + p = tail(p, x.remainder); + return p; +} + +// recursion base case, selected when "u" is one byte +template <> +inline char * tail, 1>(char * p, UnsignedOfSize<1> u) +{ + return outTwoDigits(p, u); +} + +//===----------------------------------------------------------===// +// large values are >= 10^2*N +// where x contains quotient and remainder after division by 10^N +//===----------------------------------------------------------===// + +template +static inline char * large(char * p, QuotientAndRemainder x) +{ + QuotientAndRemainder y = split(x.quotient); + p = head(p, UnsignedOfSize(y.quotient)); + p = tail(p, y.remainder); + p = tail(p, x.remainder); + return p; +} + +//===----------------------------------------------------------===// +// handle values of "u" that might be >= 10^2*N +// where N is the size of "u" in bytes +//===----------------------------------------------------------===// + +template +static inline char * uitoa(char * p, UInt u) +{ + if (u < pow10>(N)) + return head(p, UnsignedOfSize(u)); + QuotientAndRemainder x = split(u); + + return u < pow10>(2 * N) ? head(p, x) : large(p, x); +} + +// selected when "u" is one byte +template <> +inline char * uitoa, 1>(char * p, UnsignedOfSize<1> u) +{ + if (u < 10) + return outDigit(p, u); + else if (u < 100) + return outTwoDigits(p, u); + else + { + p = outDigit(p, u / 100); + p = outTwoDigits(p, u % 100); + return p; + } +} + +//===----------------------------------------------------------===// +// handle unsigned and signed integral operands +//===----------------------------------------------------------===// + +// itoa: handle unsigned integral operands (selected by SFINAE) +template && std::is_integral_v> * = nullptr> +static inline char * itoa(U u, char * p) +{ + return convert::uitoa(p, u); +} + +// itoa: handle signed integral operands (selected by SFINAE) +template && std::is_integral_v> * = nullptr> +static inline char * itoa(I i, char * p) +{ + // Need "mask" to be filled with a copy of the sign bit. + // If "i" is a negative value, then the result of "operator >>" + // is implementation-defined, though usually it is an arithmetic + // right shift that replicates the sign bit. + // Use a conditional expression to be portable, + // a good optimizing compiler generates an arithmetic right shift + // and avoids the conditional branch. + UnsignedOfSize mask = i < 0 ? ~UnsignedOfSize(0) : 0; + // Now get the absolute value of "i" and cast to unsigned type UnsignedOfSize. 
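+    // (For example, with a 32-bit type: i = -5 gives mask = 0xFFFFFFFF, and the expression below computes
+    //  u = ((0xFFFFFFF6 & 0) - 0xFFFFFFFB) mod 2^32 = 5; i = 5 gives mask = 0 and u = (10 & 0xFFFFFFFF) - 5 = 5.)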
+ // Cannot use std::abs() because the result is undefined + // in 2's complement systems for the most-negative value. + // Want to avoid conditional branch for performance reasons since + // CPU branch prediction will be ineffective when negative values + // occur randomly. + // Let "u" be "i" cast to unsigned type UnsignedOfSize. + // Subtract "u" from 2*u if "i" is positive or 0 if "i" is negative. + // This yields the absolute value with the desired type without + // using a conditional branch and without invoking undefined or + // implementation defined behavior: + UnsignedOfSize u = ((2 * UnsignedOfSize(i)) & ~mask) - UnsignedOfSize(i); + // Unconditionally store a minus sign when producing digits + // in a forward direction and increment the pointer only if + // the value is in fact negative. + // This avoids a conditional branch and is safe because we will + // always produce at least one digit and it will overwrite the + // minus sign when the value is not negative. + *p = '-'; + p += (mask & 1); + p = convert::uitoa(p, u); + return p; +} +} + + +template +static NO_INLINE char * writeUIntText(T _x, char * p) +{ + static_assert(std::is_same_v || std::is_same_v); + using T_ = std::conditional_t< + std::is_same_v, + unsigned __int128, +#if defined(__x86_64__) +# pragma clang diagnostic push +# pragma clang diagnostic ignored "-Wbit-int-extension" + unsigned _BitInt(256) +# pragma clang diagnostic pop +#else + T +#endif + >; + + T_ x; + T_ hundred(100ULL); + if constexpr (std::is_same_v) + { + x = (T_(_x.items[T::_impl::little(1)]) << 64) + T_(_x.items[T::_impl::little(0)]); + } + else + { +#if defined(__x86_64__) + x = (T_(_x.items[T::_impl::little(3)]) << 192) + (T_(_x.items[T::_impl::little(2)]) << 128) + + (T_(_x.items[T::_impl::little(1)]) << 64) + T_(_x.items[T::_impl::little(0)]); +#else + x = _x; +#endif + } + + int len = digits10(x); + auto * pp = p + len; + while (x >= hundred) + { + const auto i = x % hundred; + x /= hundred; + pp -= 2; + outTwoDigits(pp, i); + } + if (x < 10) + *p = '0' + x; + else + outTwoDigits(p, x); + return p + len; +} + +static ALWAYS_INLINE inline char * writeLeadingMinus(char * pos) +{ + *pos = '-'; + return pos + 1; +} + +template +static ALWAYS_INLINE inline char * writeSIntText(T x, char * pos) +{ + static_assert(std::is_same_v || std::is_same_v); + + using UnsignedT = make_unsigned_t; + static constexpr T min_int = UnsignedT(1) << (sizeof(T) * 8 - 1); + + if (unlikely(x == min_int)) + { + if constexpr (std::is_same_v) + { + const char * res = "-170141183460469231731687303715884105728"; + memcpy(pos, res, strlen(res)); + return pos + strlen(res); + } + else if constexpr (std::is_same_v) + { + const char * res = "-57896044618658097711785492504343953926634992332820282019728792003956564819968"; + memcpy(pos, res, strlen(res)); + return pos + strlen(res); + } + } + + if (x < 0) + { + x = -x; + pos = writeLeadingMinus(pos); + } + return writeUIntText(UnsignedT(x), pos); +} +} + +template +char * itoa(T i, char * p) +{ + return convert::itoa(i, p); +} + +template <> +char * itoa(UInt8 i, char * p) +{ + return convert::itoa(uint8_t(i), p); +} + +template <> +char * itoa(Int8 i, char * p) +{ + return convert::itoa(int8_t(i), p); +} + +template <> +char * itoa(UInt128 i, char * p) +{ + return writeUIntText(i, p); +} + +template <> +char * itoa(Int128 i, char * p) +{ + return writeSIntText(i, p); +} + +template <> +char * itoa(UInt256 i, char * p) +{ + return writeUIntText(i, p); +} + +template <> +char * itoa(Int256 i, char * p) +{ + return 
writeSIntText(i, p); +} + +#define FOR_MISSING_INTEGER_TYPES(M) \ + M(int8_t) \ + M(uint8_t) \ + M(UInt16) \ + M(UInt32) \ + M(UInt64) \ + M(Int16) \ + M(Int32) \ + M(Int64) + +#define INSTANTIATION(T) template char * itoa(T i, char * p); +FOR_MISSING_INTEGER_TYPES(INSTANTIATION) + +#undef FOR_MISSING_INTEGER_TYPES +#undef INSTANTIATION + + +#define DIGITS_INTEGER_TYPES(M) \ + M(uint8_t) \ + M(UInt8) \ + M(UInt16) \ + M(UInt32) \ + M(UInt64) \ + M(UInt128) \ + M(UInt256) + +#define INSTANTIATION(T) template int digits10(T x); +DIGITS_INTEGER_TYPES(INSTANTIATION) + +#undef DIGITS_INTEGER_TYPES +#undef INSTANTIATION diff --git a/base/base/itoa.h b/base/base/itoa.h index a36eecaf1e5..71603cdeb88 100644 --- a/base/base/itoa.h +++ b/base/base/itoa.h @@ -1,474 +1,46 @@ #pragma once -// Based on https://github.com/amdn/itoa and combined with our optimizations -// -//=== itoa.h - Fast integer to ascii conversion --*- C++ -*-// -// -// The MIT License (MIT) -// Copyright (c) 2016 Arturo Martin-de-Nicolas -// -// Permission is hereby granted, free of charge, to any person obtaining a copy -// of this software and associated documentation files (the "Software"), to deal -// in the Software without restriction, including without limitation the rights -// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell -// copies of the Software, and to permit persons to whom the Software is -// furnished to do so, subject to the following conditions: -// -// The above copyright notice and this permission notice shall be included -// in all copies or substantial portions of the Software. -// -// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR -// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, -// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE -// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER -// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, -// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE -// SOFTWARE. -//===----------------------------------------------------------------------===// - -#include -#include -#include -#include #include +template char * itoa(T i, char * p); -template -inline int digits10(T x) -{ - if (x < 10ULL) - return 1; - if (x < 100ULL) - return 2; - if (x < 1000ULL) - return 3; +template <> char * itoa(UInt8 i, char * p); +template <> char * itoa(Int8 i, char * p); +template <> char * itoa(UInt128 i, char * p); +template <> char * itoa(Int128 i, char * p); +template <> char * itoa(UInt256 i, char * p); +template <> char * itoa(Int256 i, char * p); - if (x < 1000000000000ULL) - { - if (x < 100000000ULL) - { - if (x < 1000000ULL) - { - if (x < 10000ULL) - return 4; - else - return 5 + (x >= 100000ULL); - } +#define FOR_MISSING_INTEGER_TYPES(M) \ + M(int8_t) \ + M(uint8_t) \ + M(UInt16) \ + M(UInt32) \ + M(UInt64) \ + M(Int16) \ + M(Int32) \ + M(Int64) - return 7 + (x >= 10000000ULL); - } +#define INSTANTIATION(T) \ + extern template char * itoa(T i, char * p); +FOR_MISSING_INTEGER_TYPES(INSTANTIATION) - if (x < 10000000000ULL) - return 9 + (x >= 1000000000ULL); - - return 11 + (x >= 100000000000ULL); - } - - return 12 + digits10(x / 1000000000000ULL); -} +#undef FOR_MISSING_INTEGER_TYPES +#undef INSTANTIATION -namespace impl -{ +template int digits10(T x); -template -static constexpr T pow10(size_t x) -{ - return x ? 
10 * pow10(x - 1) : 1; -} - -// Division by a power of 10 is implemented using a multiplicative inverse. -// This strength reduction is also done by optimizing compilers, but -// presently the fastest results are produced by using the values -// for the multiplication and the shift as given by the algorithm -// described by Agner Fog in "Optimizing Subroutines in Assembly Language" -// -// http://www.agner.org/optimize/optimizing_assembly.pdf -// -// "Integer division by a constant (all processors) -// A floating point number can be divided by a constant by multiplying -// with the reciprocal. If we want to do the same with integers, we have -// to scale the reciprocal by 2n and then shift the product to the right -// by n. There are various algorithms for finding a suitable value of n -// and compensating for rounding errors. The algorithm described below -// was invented by Terje Mathisen, Norway, and not published elsewhere." - -/// Division by constant is performed by: -/// 1. Adding 1 if needed; -/// 2. Multiplying by another constant; -/// 3. Shifting right by another constant. -template -struct Division -{ - static constexpr bool add{add_}; - static constexpr UInt multiplier{multiplier_}; - static constexpr unsigned shift{shift_}; -}; - -/// Select a type with appropriate number of bytes from the list of types. -/// First parameter is the number of bytes requested. Then goes a list of types with 1, 2, 4, ... number of bytes. -/// Example: SelectType<4, uint8_t, uint16_t, uint32_t, uint64_t> will select uint32_t. -template -struct SelectType -{ - using Result = typename SelectType::Result; -}; - -template -struct SelectType<1, T, Ts...> -{ - using Result = T; -}; - - -/// Division by 10^N where N is the size of the type. -template -using DivisionBy10PowN = typename SelectType -< - N, - Division, /// divide by 10 - Division, /// divide by 100 - Division, /// divide by 10000 - Division /// divide by 100000000 ->::Result; - -template -using UnsignedOfSize = typename SelectType -< - N, - uint8_t, - uint16_t, - uint32_t, - uint64_t, - __uint128_t ->::Result; - -/// Holds the result of dividing an unsigned N-byte variable by 10^N resulting in -template -struct QuotientAndRemainder -{ - UnsignedOfSize quotient; // quotient with fewer than 2*N decimal digits - UnsignedOfSize remainder; // remainder with at most N decimal digits -}; - -template -QuotientAndRemainder static inline split(UnsignedOfSize value) -{ - constexpr DivisionBy10PowN division; - - UnsignedOfSize quotient = (division.multiplier * (UnsignedOfSize<2 * N>(value) + division.add)) >> division.shift; - UnsignedOfSize remainder = static_cast>(value - quotient * pow10>(N)); - - return {quotient, remainder}; -} - - -static inline char * outDigit(char * p, uint8_t value) -{ - *p = '0' + value; - ++p; - return p; -} - -// Using a lookup table to convert binary numbers from 0 to 99 -// into ascii characters as described by Andrei Alexandrescu in -// https://www.facebook.com/notes/facebook-engineering/three-optimization-tips-for-c/10151361643253920/ - -static const char digits[201] = "00010203040506070809" - "10111213141516171819" - "20212223242526272829" - "30313233343536373839" - "40414243444546474849" - "50515253545556575859" - "60616263646566676869" - "70717273747576777879" - "80818283848586878889" - "90919293949596979899"; - -static inline char * outTwoDigits(char * p, uint8_t value) -{ - memcpy(p, &digits[value * 2], 2); - p += 2; - return p; -} - - -namespace convert -{ - template static char * head(char * p, UInt u); - 
template static char * tail(char * p, UInt u); - - //===----------------------------------------------------------===// - // head: find most significant digit, skip leading zeros - //===----------------------------------------------------------===// - - // "x" contains quotient and remainder after division by 10^N - // quotient is less than 10^N - template - static inline char * head(char * p, QuotientAndRemainder x) - { - p = head(p, UnsignedOfSize(x.quotient)); - p = tail(p, x.remainder); - return p; - } - - // "u" is less than 10^2*N - template - static inline char * head(char * p, UInt u) - { - return u < pow10>(N) - ? head(p, UnsignedOfSize(u)) - : head(p, split(u)); - } - - // recursion base case, selected when "u" is one byte - template <> - inline char * head, 1>(char * p, UnsignedOfSize<1> u) - { - return u < 10 - ? outDigit(p, u) - : outTwoDigits(p, u); - } - - //===----------------------------------------------------------===// - // tail: produce all digits including leading zeros - //===----------------------------------------------------------===// - - // recursive step, "u" is less than 10^2*N - template - static inline char * tail(char * p, UInt u) - { - QuotientAndRemainder x = split(u); - p = tail(p, UnsignedOfSize(x.quotient)); - p = tail(p, x.remainder); - return p; - } - - // recursion base case, selected when "u" is one byte - template <> - inline char * tail, 1>(char * p, UnsignedOfSize<1> u) - { - return outTwoDigits(p, u); - } - - //===----------------------------------------------------------===// - // large values are >= 10^2*N - // where x contains quotient and remainder after division by 10^N - //===----------------------------------------------------------===// - - template - static inline char * large(char * p, QuotientAndRemainder x) - { - QuotientAndRemainder y = split(x.quotient); - p = head(p, UnsignedOfSize(y.quotient)); - p = tail(p, y.remainder); - p = tail(p, x.remainder); - return p; - } - - //===----------------------------------------------------------===// - // handle values of "u" that might be >= 10^2*N - // where N is the size of "u" in bytes - //===----------------------------------------------------------===// - - template - static inline char * uitoa(char * p, UInt u) - { - if (u < pow10>(N)) - return head(p, UnsignedOfSize(u)); - QuotientAndRemainder x = split(u); - - return u < pow10>(2 * N) - ? head(p, x) - : large(p, x); - } - - // selected when "u" is one byte - template <> - inline char * uitoa, 1>(char * p, UnsignedOfSize<1> u) - { - if (u < 10) - return outDigit(p, u); - else if (u < 100) - return outTwoDigits(p, u); - else - { - p = outDigit(p, u / 100); - p = outTwoDigits(p, u % 100); - return p; - } - } - - //===----------------------------------------------------------===// - // handle unsigned and signed integral operands - //===----------------------------------------------------------===// - - // itoa: handle unsigned integral operands (selected by SFINAE) - template && std::is_integral_v> * = nullptr> - static inline char * itoa(U u, char * p) - { - return convert::uitoa(p, u); - } - - // itoa: handle signed integral operands (selected by SFINAE) - template && std::is_integral_v> * = nullptr> - static inline char * itoa(I i, char * p) - { - // Need "mask" to be filled with a copy of the sign bit. - // If "i" is a negative value, then the result of "operator >>" - // is implementation-defined, though usually it is an arithmetic - // right shift that replicates the sign bit. 
- // Use a conditional expression to be portable, - // a good optimizing compiler generates an arithmetic right shift - // and avoids the conditional branch. - UnsignedOfSize mask = i < 0 ? ~UnsignedOfSize(0) : 0; - // Now get the absolute value of "i" and cast to unsigned type UnsignedOfSize. - // Cannot use std::abs() because the result is undefined - // in 2's complement systems for the most-negative value. - // Want to avoid conditional branch for performance reasons since - // CPU branch prediction will be ineffective when negative values - // occur randomly. - // Let "u" be "i" cast to unsigned type UnsignedOfSize. - // Subtract "u" from 2*u if "i" is positive or 0 if "i" is negative. - // This yields the absolute value with the desired type without - // using a conditional branch and without invoking undefined or - // implementation defined behavior: - UnsignedOfSize u = ((2 * UnsignedOfSize(i)) & ~mask) - UnsignedOfSize(i); - // Unconditionally store a minus sign when producing digits - // in a forward direction and increment the pointer only if - // the value is in fact negative. - // This avoids a conditional branch and is safe because we will - // always produce at least one digit and it will overwrite the - // minus sign when the value is not negative. - *p = '-'; - p += (mask & 1); - p = convert::uitoa(p, u); - return p; - } -} - - -template -static inline char * writeUIntText(T _x, char * p) -{ - int len = digits10(_x); - static_assert(std::is_same_v || std::is_same_v); - using T_ = std::conditional_t< - std::is_same_v, - unsigned __int128, -#if defined(__x86_64__) -#pragma clang diagnostic push -#pragma clang diagnostic ignored "-Wbit-int-extension" - unsigned _BitInt(256) -#pragma clang diagnostic pop -#else - T -#endif - >; - - T_ x; - T_ hundred(100ULL); - if constexpr (std::is_same_v) - { - x = (T_(_x.items[T::_impl::little(1)]) << 64) + T_(_x.items[T::_impl::little(0)]); - } - else - { -#if defined(__x86_64__) - x = (T_(_x.items[T::_impl::little(3)]) << 192) + (T_(_x.items[T::_impl::little(2)]) << 128) + - (T_(_x.items[T::_impl::little(1)]) << 64) + T_(_x.items[T::_impl::little(0)]); -#else - x = _x; -#endif - } - - auto * pp = p + len; - while (x >= hundred) - { - const auto i = x % hundred; - x /= hundred; - pp -= 2; - outTwoDigits(pp, i); - } - if (x < 10) - *p = '0' + x; - else - outTwoDigits(p, x); - return p + len; -} - -static inline char * writeLeadingMinus(char * pos) -{ - *pos = '-'; - return pos + 1; -} - -template -static inline char * writeSIntText(T x, char * pos) -{ - static_assert(std::is_same_v || std::is_same_v); - - using UnsignedT = make_unsigned_t; - static constexpr T min_int = UnsignedT(1) << (sizeof(T) * 8 - 1); - - if (unlikely(x == min_int)) - { - if constexpr (std::is_same_v) - { - const char * res = "-170141183460469231731687303715884105728"; - memcpy(pos, res, strlen(res)); - return pos + strlen(res); - } - else if constexpr (std::is_same_v) - { - const char * res = "-57896044618658097711785492504343953926634992332820282019728792003956564819968"; - memcpy(pos, res, strlen(res)); - return pos + strlen(res); - } - } - - if (x < 0) - { - x = -x; - pos = writeLeadingMinus(pos); - } - return writeUIntText(UnsignedT(x), pos); -} - -} - -template -char * itoa(I i, char * p) -{ - return impl::convert::itoa(i, p); -} - -template <> -inline char * itoa(char8_t i, char * p) -{ - return impl::convert::itoa(uint8_t(i), p); -} - -template <> -inline char * itoa(UInt128 i, char * p) -{ - return impl::writeUIntText(i, p); -} - -template <> -inline char * 
itoa(Int128 i, char * p) -{ - return impl::writeSIntText(i, p); -} - -template <> -inline char * itoa(UInt256 i, char * p) -{ - return impl::writeUIntText(i, p); -} - -template <> -inline char * itoa(Int256 i, char * p) -{ - return impl::writeSIntText(i, p); -} +#define DIGITS_INTEGER_TYPES(M) \ + M(uint8_t) \ + M(UInt8) \ + M(UInt16) \ + M(UInt32) \ + M(UInt64) \ + M(UInt128) \ + M(UInt256) +#define INSTANTIATION(T) \ + extern template int digits10(T x); +DIGITS_INTEGER_TYPES(INSTANTIATION) +#undef DIGITS_INTEGER_TYPES +#undef INSTANTIATION diff --git a/src/Functions/CMakeLists.txt b/src/Functions/CMakeLists.txt index ac3e3671ae0..dea369a508a 100644 --- a/src/Functions/CMakeLists.txt +++ b/src/Functions/CMakeLists.txt @@ -37,6 +37,7 @@ list (APPEND PUBLIC_LIBS clickhouse_dictionaries_embedded clickhouse_parsers ch_contrib::consistent_hashing + common dbms ch_contrib::metrohash ch_contrib::murmurhash From 7fd13df8a5055892d2f8cdc83dcb900c19c87a95 Mon Sep 17 00:00:00 2001 From: Han Fei Date: Thu, 7 Mar 2024 17:09:55 +0100 Subject: [PATCH 161/985] check memory limit periodically --- programs/keeper/Keeper.cpp | 10 +++++++++ programs/server/Server.cpp | 1 + src/Common/CgroupsMemoryUsageObserver.cpp | 26 +++++++++++++++++------ src/Common/CgroupsMemoryUsageObserver.h | 7 ++++-- 4 files changed, 35 insertions(+), 9 deletions(-) diff --git a/programs/keeper/Keeper.cpp b/programs/keeper/Keeper.cpp index 8972c82eab8..76dd8cb15a5 100644 --- a/programs/keeper/Keeper.cpp +++ b/programs/keeper/Keeper.cpp @@ -10,6 +10,7 @@ #include #include #include +#include #include #include #include @@ -623,6 +624,15 @@ try buildLoggers(config(), logger()); main_config_reloader->start(); + std::optional observer; + auto cgroups_memory_observer_wait_time = config().getUInt64("keeper_server.cgroups_memory_observer_wait_time", 1); + if (cgroups_memory_observer_wait_time > 0) + { + observer.emplace(std::chrono::seconds(cgroups_memory_observer_wait_time)); + observer->startThread(); + } + + LOG_INFO(log, "Ready for connections."); waitForTerminationRequest(); diff --git a/programs/server/Server.cpp b/programs/server/Server.cpp index c45291ba52c..6b282893dee 100644 --- a/programs/server/Server.cpp +++ b/programs/server/Server.cpp @@ -1362,6 +1362,7 @@ try cgroups_memory_usage_observer->setLimits( static_cast(max_server_memory_usage * hard_limit_ratio), static_cast(max_server_memory_usage * soft_limit_ratio)); + cgroups_memory_usage_observer->startThread(); } size_t merges_mutations_memory_usage_soft_limit = new_server_settings.merges_mutations_memory_usage_soft_limit; diff --git a/src/Common/CgroupsMemoryUsageObserver.cpp b/src/Common/CgroupsMemoryUsageObserver.cpp index 9bed6b191e4..5f24c2553b5 100644 --- a/src/Common/CgroupsMemoryUsageObserver.cpp +++ b/src/Common/CgroupsMemoryUsageObserver.cpp @@ -8,7 +8,9 @@ #include #include #include +#include #include +#include #include #include @@ -48,11 +50,10 @@ CgroupsMemoryUsageObserver::~CgroupsMemoryUsageObserver() void CgroupsMemoryUsageObserver::setLimits(uint64_t hard_limit_, uint64_t soft_limit_) { + std::lock_guard lock(set_limit_mutex); if (hard_limit_ == hard_limit && soft_limit_ == soft_limit) return; - stopThread(); - hard_limit = hard_limit_; soft_limit = soft_limit_; @@ -94,8 +95,6 @@ void CgroupsMemoryUsageObserver::setLimits(uint64_t hard_limit_, uint64_t soft_l } }; - startThread(); - LOG_INFO(log, "Set new limits, soft limit: {}, hard limit: {}", ReadableSize(soft_limit_), ReadableSize(hard_limit_)); } @@ -277,7 +276,7 @@ void 
CgroupsMemoryUsageObserver::stopThread() void CgroupsMemoryUsageObserver::runThread() { setThreadName("CgrpMemUsgObsr"); - + last_memory_amount = getMemoryAmount(); std::unique_lock lock(thread_mutex); while (true) { @@ -286,8 +285,21 @@ void CgroupsMemoryUsageObserver::runThread() try { - uint64_t memory_usage = file.readMemoryUsage(); - processMemoryUsage(memory_usage); + uint64_t memory_limit = getMemoryAmount(); + if (memory_limit != last_memory_amount) + { + last_memory_amount = memory_limit; + /// if we find memory amount changes, we just reload config. + /// Reloading config will check the memory amount again and calculate soft/hard limit again. + auto global_context = getContext()->getGlobalContext(); + global_context->reloadConfig(); + } + std::lock_guard set_limit_lock(set_limit_mutex); + if (soft_limit > 0 && hard_limit > 0) + { + uint64_t memory_usage = file.readMemoryUsage(); + processMemoryUsage(memory_usage); + } } catch (...) { diff --git a/src/Common/CgroupsMemoryUsageObserver.h b/src/Common/CgroupsMemoryUsageObserver.h index 28bf08c82b5..6edf2e2049d 100644 --- a/src/Common/CgroupsMemoryUsageObserver.h +++ b/src/Common/CgroupsMemoryUsageObserver.h @@ -1,6 +1,7 @@ #pragma once #include +#include #include #include @@ -14,7 +15,7 @@ namespace DB /// - When the soft memory limit is hit, drop jemalloc cache. /// - When the hard memory limit is hit, update MemoryTracking metric to throw memory exceptions faster. #if defined(OS_LINUX) -class CgroupsMemoryUsageObserver +class CgroupsMemoryUsageObserver : public WithContext { public: enum class CgroupsVersion @@ -27,6 +28,7 @@ public: ~CgroupsMemoryUsageObserver(); void setLimits(uint64_t hard_limit_, uint64_t soft_limit_); + void startThread(); size_t getHardLimit() const { return hard_limit; } size_t getSoftLimit() const { return soft_limit; } @@ -64,16 +66,17 @@ private: File file; - void startThread(); void stopThread(); void runThread(); void processMemoryUsage(uint64_t usage); std::mutex thread_mutex; + std::mutex set_limit_mutex; std::condition_variable cond; ThreadFromGlobalPool thread; bool quit = false; + uint64_t last_memory_amount; }; #else From bd194aab41401492c5d628269df53e68243a1211 Mon Sep 17 00:00:00 2001 From: johnnymatthews <9611008+johnnymatthews@users.noreply.github.com> Date: Thu, 7 Mar 2024 12:55:21 -0400 Subject: [PATCH 162/985] Adds makeDateTime64 function. --- .../functions/date-time-functions.md | 137 ++++++++++++++---- .../functions/other-functions.md | 65 ++++++++- 2 files changed, 170 insertions(+), 32 deletions(-) diff --git a/docs/en/sql-reference/functions/date-time-functions.md b/docs/en/sql-reference/functions/date-time-functions.md index 41503abfa2f..12f0c996ce7 100644 --- a/docs/en/sql-reference/functions/date-time-functions.md +++ b/docs/en/sql-reference/functions/date-time-functions.md @@ -26,66 +26,115 @@ SELECT ## makeDate -Creates a [Date](../../sql-reference/data-types/date.md) -- from a year, month and day argument, or -- from a year and day of year argument. +Creates a [Date](../../sql-reference/data-types/date.md) from either one of the following sets of arguments: -**Syntax** +- a year, month, and day. +- a year and day of year. -``` sql -makeDate(year, month, day); -makeDate(year, day_of_year); +### Syntax + +Using a year, month, and day: + +```sql +makeDate(year, month, day) ``` -Alias: -- `MAKEDATE(year, month, day);` -- `MAKEDATE(year, day_of_year);` +Using a year and day of year: -**Arguments** +```sql +makeDate(year, day_of_year) +``` + +### Arguments - `year` — Year. 
[Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). - `month` — Month. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). - `day` — Day. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). - `day_of_year` — Day of the year. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). -**Returned value** +### Returned values -- A date created from the arguments. +A date created from the arguments. Type: [Date](../../sql-reference/data-types/date.md). -**Example** +### Examples Create a Date from a year, month and day: -``` sql +```sql SELECT makeDate(2023, 2, 28) AS Date; ``` -Result: - -``` text -┌───────date─┐ -│ 2023-02-28 │ -└────────────┘ +```response +2023-02-28 ``` -Create a Date from a year and day of year argument: +Create a Date from a year and day of year: ``` sql SELECT makeDate(2023, 42) AS Date; ``` -Result: - -``` text -┌───────date─┐ -│ 2023-02-11 │ -└────────────┘ +```response +2023-02-11 ``` + ## makeDate32 -Like [makeDate](#makeDate) but produces a [Date32](../../sql-reference/data-types/date32.md). +Creates a date of type [Date32](../../sql-reference/data-types/date32.md) from either one of the following sets of arguments: + +- a year, month, and day. +- a year and day of year. + +### Syntax + +Using a year, month, and day: + +```sql +makeDate32(year, month, day) +``` + +Using a year and day of year: + +```sql +makeDate32(year, day_of_year) +``` + +### Arguments + +- `year` — Year. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). +- `month` — Month. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). +- `day` — Day. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). +- `day_of_year` — Day of the year. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). + +### Returned values + +A date created from the arguments. + +Type: [Date32](../../sql-reference/data-types/date32.md). + +### Examples + +Create a date from a year, month, and day: + +```sql +SELECT makeDate32(2024, 1, 1); +``` + +```response +2024-01-01 +``` + +Create a Date from a year and day of year: + +``` sql +SELECT makeDate32(2024, 100); +``` + +```response +2024-04-09 +``` ## makeDateTime @@ -129,12 +178,38 @@ Result: ## makeDateTime64 -Like [makeDateTime](#makedatetime) but produces a [DateTime64](../../sql-reference/data-types/datetime64.md). +Create a [DateTime64](../../sql-reference/data-types/datetime64.md) data type value from its components (year, month, day, hour, minute, second, and optionally, subsecond precision). + +The DateTime64 data type stores both the date and time components in a single 64-bit integer value. The precision of the time component is configurable, allowing you to store time values with subsecond precision up to nanoseconds. 
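To make the effect of the precision argument concrete, here is a small illustrative query (a hypothetical sketch, consistent with the example further below; the full syntax and argument list follow): the same `fraction` value yields different subsecond digits depending on the requested `precision`.

```sql
-- Illustration only: the fraction 779 is interpreted in units of 10^-precision seconds.
SELECT
    makeDateTime64(2023, 5, 15, 10, 30, 45, 779, 3) AS precision_3, -- 2023-05-15 10:30:45.779
    makeDateTime64(2023, 5, 15, 10, 30, 45, 779, 5) AS precision_5; -- 2023-05-15 10:30:45.00779
```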
**Syntax**

+```sql
+makeDateTime64(year, month, day, hour, minute, second[, fraction[, precision]])
+```
+
+**Arguments**
+
+- `year` — [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). The year component (0-9999).
+- `month` — Month. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). The month component (1-12).
+- `day` — Day. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). The day component (1-31).
+- `hour` — Hour. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). The hour component (0-23).
+- `minute` — Minute. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). The minute component (0-59).
+- `second` — Second. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). The second component (0-59).
+- `fraction` (optional) [Integer](../../sql-reference/data-types/int-uint.md): The subsecond value, interpreted in units of 10^-`precision` seconds (for example, `fraction = 779` with `precision = 5` gives `.00779`).
+- `precision` (optional) [Integer](../../sql-reference/data-types/int-uint.md): The precision of the subsecond component (0-9, where 0 means no subsecond precision, and 9 means nanosecond precision).
+
+**Returned value**
+
+A date and time value of type [DateTime64](../../sql-reference/data-types/datetime64.md) created from the supplied arguments.
+
+**Example**
+
 ``` sql
-makeDateTime64(year, month, day, hour, minute, second[, fraction[, precision[, timezone]]])
+SELECT makeDateTime64(2023, 5, 15, 10, 30, 45, 779, 5);
+```
+
+```response
+2023-05-15 10:30:45.00779
 ```

 ## timestamp
diff --git a/docs/en/sql-reference/functions/other-functions.md b/docs/en/sql-reference/functions/other-functions.md
index 739b688a0d2..10ceedad9aa 100644
--- a/docs/en/sql-reference/functions/other-functions.md
+++ b/docs/en/sql-reference/functions/other-functions.md
@@ -1866,7 +1866,7 @@ As you can see, `runningAccumulate` merges states for each group of rows separat
 ## joinGet

-The function lets you extract data from the table the same way as from a [dictionary](../../sql-reference/dictionaries/index.md).
+Allows you to extract data from a specific column in a Join table, similar to how you would access a value from a dictionary.

 Gets the data from [Join](../../engines/table-engines/special/join.md#creating-a-table) tables using the specified join key.

@@ -1927,6 +1927,69 @@ Result:
 └──────────────────────────────────────────────────┘
 ```

+## joinGetOrNull
+
+Allows you to extract data from a specific column in a Join table, similar to how you would access a value from a dictionary.
+
+Gets the data from [Join](../../engines/table-engines/special/join.md#creating-a-table) tables using the specified join key.
+
+Only supports tables created with the `ENGINE = Join(ANY, LEFT, <join_keys>)` statement.
+
+### Syntax
+
+```sql
+joinGetOrNull(join_storage_table_name, `value_column`, join_keys)
+```
+
+### Parameters
+
+- `join_storage_table_name` — an [identifier](../../sql-reference/syntax.md#syntax-identifiers) indicating where the search is performed. The identifier is searched in the default database (see setting `default_database` in the config file). To override the default database, use `USE db_name` or specify the database and the table through the separator `db_name.db_table` as in the example.
+- `value_column` — name of the column of the table that contains the required data.
+- `join_keys` — list of keys.
+
+### Returned value
+
+Returns a list of values corresponding to the list of keys.
+
+If a certain key does not exist in the source table, then `0` or `null` is returned, based on the [join_use_nulls](../../operations/settings/settings.md#join_use_nulls) setting.
+
+More info about `join_use_nulls` is available in [Join operation](../../engines/table-engines/special/join.md).
+
+### Example
+
+Input table:
+
+``` sql
+CREATE DATABASE db_test
+CREATE TABLE db_test.id_val(`id` UInt32, `val` UInt32) ENGINE = Join(ANY, LEFT, id) SETTINGS join_use_nulls = 1
+INSERT INTO db_test.id_val VALUES (1,11)(2,12)(4,13)
+```
+
+``` text
+┌─id─┬─val─┐
+│ 4 │ 13 │
+│ 2 │ 12 │
+│ 1 │ 11 │
+└────┴─────┘
+```
+
+Query:
+
+``` sql
+SELECT joinGet(db_test.id_val, 'val', toUInt32(number)) from numbers(4) SETTINGS join_use_nulls = 1
+```
+
+Result:
+
+``` text
+┌─joinGet(db_test.id_val, 'val', toUInt32(number))─┐
+│ 0 │
+│ 11 │
+│ 12 │
+│ 0 │
+└──────────────────────────────────────────────────┘
+```
+
 ## catboostEvaluate(path_to_model, feature_1, feature_2, …, feature_n)

 :::note

From 1b2357198d4c1b92fbe3f5a6c0c11be6f1d80a8f Mon Sep 17 00:00:00 2001
From: Igor Nikonov
Date: Thu, 7 Mar 2024 17:03:43 +0000
Subject: [PATCH 163/985] Fix: parallel replicas + prewhere

---
 src/Interpreters/InterpreterSelectQuery.cpp | 5 ++--
 ...03006_parallel_replicas_prewhere.reference | 0
 .../03006_parallel_replicas_prewhere.sql | 29 +++++++++++++++++++
 3 files changed, 32 insertions(+), 2 deletions(-)
 create mode 100644 tests/queries/0_stateless/03006_parallel_replicas_prewhere.reference
 create mode 100644 tests/queries/0_stateless/03006_parallel_replicas_prewhere.sql

diff --git a/src/Interpreters/InterpreterSelectQuery.cpp b/src/Interpreters/InterpreterSelectQuery.cpp
index eaa256a16b0..80e2d5afef7 100644
--- a/src/Interpreters/InterpreterSelectQuery.cpp
+++ b/src/Interpreters/InterpreterSelectQuery.cpp
@@ -2112,7 +2112,7 @@ void InterpreterSelectQuery::applyFiltersToPrewhereInAnalysis(ExpressionAnalysis
 {
 /// Execute row level filter in prewhere as a part of "move to prewhere" optimization.
 analysis.prewhere_info
- = std::make_shared<PrewhereInfo>(std::move(analysis.filter_info->actions), std::move(analysis.filter_info->column_name));
+ = std::make_shared<PrewhereInfo>(analysis.filter_info->actions, analysis.filter_info->column_name);
 analysis.prewhere_info->prewhere_actions->projectInput(false);
 analysis.prewhere_info->remove_prewhere_column = analysis.filter_info->do_remove_column;
 analysis.prewhere_info->need_filter = true;
@@ -2121,8 +2121,9 @@ void InterpreterSelectQuery::applyFiltersToPrewhereInAnalysis(ExpressionAnalysis
 }
 else
 {
+ chassert(analysis.filter_info->actions);
 /// Add row level security actions to prewhere.
- analysis.prewhere_info->row_level_filter = std::move(analysis.filter_info->actions); + analysis.prewhere_info->row_level_filter = analysis.filter_info->actions; analysis.prewhere_info->row_level_column_name = std::move(analysis.filter_info->column_name); analysis.prewhere_info->row_level_filter->projectInput(false); analysis.filter_info = nullptr; diff --git a/tests/queries/0_stateless/03006_parallel_replicas_prewhere.reference b/tests/queries/0_stateless/03006_parallel_replicas_prewhere.reference new file mode 100644 index 00000000000..e69de29bb2d diff --git a/tests/queries/0_stateless/03006_parallel_replicas_prewhere.sql b/tests/queries/0_stateless/03006_parallel_replicas_prewhere.sql new file mode 100644 index 00000000000..819526b5596 --- /dev/null +++ b/tests/queries/0_stateless/03006_parallel_replicas_prewhere.sql @@ -0,0 +1,29 @@ +DROP POLICY IF EXISTS url_na_log_policy0 ON url_na_log; +DROP TABLE IF EXISTS url_na_log; + +CREATE TABLE url_na_log +( + `SiteId` UInt32, + `DateVisit` Date +) +ENGINE = MergeTree +PRIMARY KEY SiteId +ORDER BY (SiteId, DateVisit) +SETTINGS index_granularity = 1000, min_bytes_for_wide_part = 0; + +CREATE ROW POLICY url_na_log_policy0 ON url_na_log FOR SELECT USING (DateVisit < '2022-08-11') OR (DateVisit > '2022-08-19') TO default; + +INSERT INTO url_na_log +SETTINGS max_insert_block_size = 200000 +SELECT + 209, + CAST('2022-08-09', 'Date') + toIntervalDay(intDiv(number, 10000)) +FROM numbers(130000) +SETTINGS max_insert_block_size = 200000; + +EXPLAIN ESTIMATE +SELECT count() +FROM url_na_log +PREWHERE (DateVisit >= toFixedString('2022-08-10', 10)) AND (DateVisit <= '2022-08-20') +SETTINGS max_block_size = 1048576, max_threads = 1, allow_experimental_parallel_reading_from_replicas = 1, parallel_replicas_for_non_replicated_merge_tree = 1, cluster_for_parallel_replicas = 'test_cluster_one_shard_three_replicas_localhost', max_parallel_replicas = 3, allow_experimental_analyzer=0, parallel_replicas_min_number_of_rows_per_replica=10000; + From 0f0ea422f21af8e37aa5c8ef58002d608cde5c77 Mon Sep 17 00:00:00 2001 From: serxa Date: Thu, 7 Mar 2024 17:05:54 +0000 Subject: [PATCH 164/985] separate limits on number of waiting and executing queries --- .../settings.md | 16 ++- programs/server/Server.cpp | 1 + src/Common/AsyncLoader.cpp | 21 +++- src/Common/AsyncLoader.h | 65 ++++++++++- src/Common/tests/gtest_async_loader.cpp | 66 +++++++++++ src/Core/ServerSettings.h | 1 + src/Interpreters/ProcessList.cpp | 103 +++++++++++++++--- src/Interpreters/ProcessList.h | 41 ++++++- .../System/StorageSystemServerSettings.cpp | 1 + 9 files changed, 293 insertions(+), 22 deletions(-) diff --git a/docs/en/operations/server-configuration-parameters/settings.md b/docs/en/operations/server-configuration-parameters/settings.md index 07c9a2b88ab..63fbd9d1964 100644 --- a/docs/en/operations/server-configuration-parameters/settings.md +++ b/docs/en/operations/server-configuration-parameters/settings.md @@ -379,6 +379,18 @@ Type: UInt64 Default: 0 +## max_waiting_queries + +Limit on total number of concurrently waiting queries. Execution of a waiting query is blocked while required tables are loading asynchronously (see `async_load_databases`). Note that waiting queries are not counted when `max_concurrent_queries`, `max_concurrent_insert_queries`, `max_concurrent_select_queries`, `max_concurrent_queries_for_user` and `max_concurrent_queries_for_all_users` limits are checked. This correction is done to avoid hitting these limits just after server startup. Zero means unlimited. 
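The current value can be inspected at runtime; a minimal sketch (it relies on the `system.server_settings` table, to which this setting is also exported):

```sql
-- Shows the configured limit and whether it can be changed without a server restart.
SELECT name, value, changeable_without_restart
FROM system.server_settings
WHERE name = 'max_waiting_queries';
```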
+ +:::note +This setting can be modified at runtime and will take effect immediately. Queries that are already running will remain unchanged. +::: + +Type: UInt64 + +Default: 0 + ## max_connections Max server connections. @@ -1725,7 +1737,7 @@ Default value: `0.5`. Asynchronous loading of databases and tables. -If `true` all non-system databases with `Ordinary`, `Atomic` and `Replicated` engine will be loaded asynchronously after the ClickHouse server start up. See `system.asynchronous_loader` table, `tables_loader_background_pool_size` and `tables_loader_foreground_pool_size` server settings. Any query that tries to access a table, that is not yet loaded, will wait for exactly this table to be started up. If load job fails, query will rethrow an error (instead of shutting down the whole server in case of `async_load_databases = false`). The table that is waited for by at least one query will be loaded with higher priority. DDL queries on a database will wait for exactly that database to be started up. +If `true` all non-system databases with `Ordinary`, `Atomic` and `Replicated` engine will be loaded asynchronously after the ClickHouse server start up. See `system.asynchronous_loader` table, `tables_loader_background_pool_size` and `tables_loader_foreground_pool_size` server settings. Any query that tries to access a table, that is not yet loaded, will wait for exactly this table to be started up. If load job fails, query will rethrow an error (instead of shutting down the whole server in case of `async_load_databases = false`). The table that is waited for by at least one query will be loaded with higher priority. DDL queries on a database will wait for exactly that database to be started up. Also consider setting a limit `max_waiting_queries` for the total number of waiting queries. If `false`, all databases are loaded when the server starts. @@ -2926,7 +2938,7 @@ Default: 0 ## ignore_empty_sql_security_in_create_view_query {#ignore_empty_sql_security_in_create_view_query} -If true, ClickHouse doesn't write defaults for empty SQL security statement in CREATE VIEW queries. +If true, ClickHouse doesn't write defaults for empty SQL security statement in CREATE VIEW queries. 
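For illustration, a hypothetical statement this setting applies to (the view and table names are made up): when no explicit `DEFINER` / `SQL SECURITY` clause is written, the setting controls whether a server-side default is persisted into the stored `CREATE` query.

```sql
-- No SQL SECURITY clause is given here; with the setting enabled the stored CREATE
-- query keeps the statement empty, otherwise a server default may be written into it.
CREATE VIEW hits_daily AS
SELECT toDate(event_time) AS day, count() AS hits
FROM hits
GROUP BY day;
```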
:::note This setting is only necessary for the migration period and will become obsolete in 24.4 diff --git a/programs/server/Server.cpp b/programs/server/Server.cpp index a10f47be0b8..336563665a2 100644 --- a/programs/server/Server.cpp +++ b/programs/server/Server.cpp @@ -1429,6 +1429,7 @@ try global_context->getProcessList().setMaxSize(new_server_settings.max_concurrent_queries); global_context->getProcessList().setMaxInsertQueriesAmount(new_server_settings.max_concurrent_insert_queries); global_context->getProcessList().setMaxSelectQueriesAmount(new_server_settings.max_concurrent_select_queries); + global_context->getProcessList().setMaxWaitingQueriesAmount(new_server_settings.max_waiting_queries); if (config->has("keeper_server")) global_context->updateKeeperConfiguration(*config); diff --git a/src/Common/AsyncLoader.cpp b/src/Common/AsyncLoader.cpp index 140194e10b4..80e4c72f1c1 100644 --- a/src/Common/AsyncLoader.cpp +++ b/src/Common/AsyncLoader.cpp @@ -140,6 +140,11 @@ void LoadJob::finish() finish_time = std::chrono::system_clock::now(); if (waiters > 0) finished.notify_all(); + else + { + on_waiters_increment = {}; + on_waiters_decrement = {}; + } } void LoadJob::scheduled(UInt64 job_id_) @@ -765,11 +770,25 @@ void AsyncLoader::wait(std::unique_lock & job_lock, const LoadJobPtr if (job->load_status != LoadStatus::PENDING) // Shortcut just to avoid incrementing ProfileEvents return; + if (job->on_waiters_increment) + job->on_waiters_increment(job); + + // WARNING: it is important not to throw below this point to avoid `on_waiters_increment` call w/o matching `on_waiters_decrement` call + Stopwatch watch; job->waiters++; job->finished.wait(job_lock, [&] { return job->load_status != LoadStatus::PENDING; }); job->waiters--; ProfileEvents::increment(ProfileEvents::AsyncLoaderWaitMicroseconds, watch.elapsedMicroseconds()); + + if (job->on_waiters_decrement) + job->on_waiters_decrement(job); + + if (job->waiters == 0) + { + job->on_waiters_increment = {}; + job->on_waiters_decrement = {}; + } } bool AsyncLoader::canSpawnWorker(Pool & pool, std::unique_lock &) @@ -859,7 +878,7 @@ void AsyncLoader::worker(Pool & pool) try { current_load_job = job.get(); - SCOPE_EXIT({ current_load_job = nullptr; }); // Note that recursive job execution is not supported + SCOPE_EXIT({ current_load_job = nullptr; }); // Note that recursive job execution is not supported, but jobs can wait one another job->execute(*this, pool_id, job); exception_from_job = {}; } diff --git a/src/Common/AsyncLoader.h b/src/Common/AsyncLoader.h index b1b336d24dc..3f81a36aa96 100644 --- a/src/Common/AsyncLoader.h +++ b/src/Common/AsyncLoader.h @@ -59,7 +59,8 @@ enum class LoadStatus class LoadJob : private boost::noncopyable { public: - template + // NOTE: makeLoadJob() helper should be used instead of direct ctor call + template LoadJob(LoadJobSetType && dependencies_, String name_, size_t pool_id_, DFFunc && dependency_failure_, Func && func_) : dependencies(std::forward(dependencies_)) , name(std::move(name_)) @@ -69,6 +70,19 @@ public: , func(std::forward(func_)) {} + // NOTE: makeLoadJob() helper should be used instead of direct ctor call + template + LoadJob(LoadJobSetType && dependencies_, String name_, size_t pool_id_, WIFunc && on_waiters_increment_, WDFunc && on_waiters_decrement_, DFFunc && dependency_failure_, Func && func_) + : dependencies(std::forward(dependencies_)) + , name(std::move(name_)) + , execution_pool_id(pool_id_) + , pool_id(pool_id_) + , on_waiters_increment(std::forward(on_waiters_increment_)) + , 
on_waiters_decrement(std::forward(on_waiters_decrement_)) + , dependency_failure(std::forward(dependency_failure_)) + , func(std::forward(func_)) + {} + // Current job status. LoadStatus status() const; std::exception_ptr exception() const; @@ -112,6 +126,13 @@ private: std::atomic execution_pool_id; std::atomic pool_id; + // Handlers that is called by every new waiting thread, just before going to sleep. + // If `on_waiters_increment` throws, then wait is canceled, and corresponding `on_waiters_decrement` will never be called. + // It can be used for counting and limits on number of waiters. + // Note that implementations are called under `LoadJob::mutex` and should be fast. + std::function on_waiters_increment; + std::function on_waiters_decrement; + // Handler for failed or canceled dependencies. // If job needs to be canceled on `dependency` failure, then function should set `cancel` to a specific reason. // Note that implementation should be fast and cannot use AsyncLoader, because it is called under `AsyncLoader::mutex`. @@ -140,8 +161,50 @@ void cancelOnDependencyFailure(const LoadJobPtr & self, const LoadJobPtr & depen void ignoreDependencyFailure(const LoadJobPtr & self, const LoadJobPtr & dependency, std::exception_ptr & cancel); template concept LoadJobDependencyFailure = std::invocable; +template concept LoadJobOnWaiters = std::invocable; template concept LoadJobFunc = std::invocable; +LoadJobPtr makeLoadJob(LoadJobSet && dependencies, String name, LoadJobOnWaiters auto && on_waiters_increment, LoadJobOnWaiters auto && on_waiters_decrement, LoadJobDependencyFailure auto && dependency_failure, LoadJobFunc auto && func) +{ + return std::make_shared(std::move(dependencies), std::move(name), 0, on_waiters_increment, on_waiters_decrement, std::forward(dependency_failure), std::forward(func)); +} + +LoadJobPtr makeLoadJob(const LoadJobSet & dependencies, String name, LoadJobOnWaiters auto && on_waiters_increment, LoadJobOnWaiters auto && on_waiters_decrement, LoadJobDependencyFailure auto && dependency_failure, LoadJobFunc auto && func) +{ + return std::make_shared(dependencies, std::move(name), 0, on_waiters_increment, on_waiters_decrement, std::forward(dependency_failure), std::forward(func)); +} + +LoadJobPtr makeLoadJob(LoadJobSet && dependencies, size_t pool_id, String name, LoadJobOnWaiters auto && on_waiters_increment, LoadJobOnWaiters auto && on_waiters_decrement, LoadJobDependencyFailure auto && dependency_failure, LoadJobFunc auto && func) +{ + return std::make_shared(std::move(dependencies), std::move(name), pool_id, on_waiters_increment, on_waiters_decrement, std::forward(dependency_failure), std::forward(func)); +} + +LoadJobPtr makeLoadJob(const LoadJobSet & dependencies, size_t pool_id, String name, LoadJobOnWaiters auto && on_waiters_increment, LoadJobOnWaiters auto && on_waiters_decrement, LoadJobDependencyFailure auto && dependency_failure, LoadJobFunc auto && func) +{ + return std::make_shared(dependencies, std::move(name), pool_id, on_waiters_increment, on_waiters_decrement, std::forward(dependency_failure), std::forward(func)); +} + +LoadJobPtr makeLoadJob(LoadJobSet && dependencies, String name, LoadJobOnWaiters auto && on_waiters_increment, LoadJobOnWaiters auto && on_waiters_decrement, LoadJobFunc auto && func) +{ + return std::make_shared(std::move(dependencies), std::move(name), 0, on_waiters_increment, on_waiters_decrement, cancelOnDependencyFailure, std::forward(func)); +} + +LoadJobPtr makeLoadJob(const LoadJobSet & dependencies, String name, 
LoadJobOnWaiters auto && on_waiters_increment, LoadJobOnWaiters auto && on_waiters_decrement, LoadJobFunc auto && func) +{ + return std::make_shared(dependencies, std::move(name), 0, on_waiters_increment, on_waiters_decrement, cancelOnDependencyFailure, std::forward(func)); +} + +LoadJobPtr makeLoadJob(LoadJobSet && dependencies, size_t pool_id, String name, LoadJobOnWaiters auto && on_waiters_increment, LoadJobOnWaiters auto && on_waiters_decrement, LoadJobFunc auto && func) +{ + return std::make_shared(std::move(dependencies), std::move(name), pool_id, on_waiters_increment, on_waiters_decrement, cancelOnDependencyFailure, std::forward(func)); +} + +LoadJobPtr makeLoadJob(const LoadJobSet & dependencies, size_t pool_id, String name, LoadJobOnWaiters auto && on_waiters_increment, LoadJobOnWaiters auto && on_waiters_decrement, LoadJobFunc auto && func) +{ + return std::make_shared(dependencies, std::move(name), pool_id, on_waiters_increment, on_waiters_decrement, cancelOnDependencyFailure, std::forward(func)); +} + + LoadJobPtr makeLoadJob(LoadJobSet && dependencies, String name, LoadJobDependencyFailure auto && dependency_failure, LoadJobFunc auto && func) { return std::make_shared(std::move(dependencies), std::move(name), 0, std::forward(dependency_failure), std::forward(func)); diff --git a/src/Common/tests/gtest_async_loader.cpp b/src/Common/tests/gtest_async_loader.cpp index fc2537abcfc..62a27f259cc 100644 --- a/src/Common/tests/gtest_async_loader.cpp +++ b/src/Common/tests/gtest_async_loader.cpp @@ -643,6 +643,72 @@ TEST(AsyncLoader, CustomDependencyFailure) ASSERT_EQ(good_count.load(), 3); } +TEST(AsyncLoader, WaitersLimit) +{ + AsyncLoaderTest t(16); + + std::atomic waiters_total{0}; + int waiters_limit = 5; + auto waiters_inc = [&] (const LoadJobPtr &) { + int value = waiters_total.load(); + while (true) + { + if (value >= waiters_limit) + throw Exception(ErrorCodes::ASYNC_LOAD_FAILED, "Too many waiters: {}", value); + if (waiters_total.compare_exchange_strong(value, value + 1)) + break; + } + }; + auto waiters_dec = [&] (const LoadJobPtr &) { + waiters_total.fetch_sub(1); + }; + + std::barrier sync(2); + t.loader.start(); + + auto job_func = [&] (AsyncLoader &, const LoadJobPtr &) { + sync.arrive_and_wait(); // (A) + }; + + auto job = makeLoadJob({}, "job", waiters_inc, waiters_dec, job_func); + auto task = t.schedule({job}); + + std::atomic failure{0}; + std::atomic success{0}; + std::vector waiters; + waiters.reserve(10); + auto waiter = [&] { + try + { + t.loader.wait(job); + success.fetch_add(1); + } + catch(...) + { + failure.fetch_add(1); + } + }; + + for (int i = 0; i < 10; i++) + waiters.emplace_back(waiter); + + while (failure.load() != 5) + std::this_thread::yield(); + + ASSERT_EQ(job->waitersCount(), 5); + + sync.arrive_and_wait(); // (A) + + for (auto & thread : waiters) + thread.join(); + + ASSERT_EQ(success.load(), 5); + ASSERT_EQ(failure.load(), 5); + ASSERT_EQ(waiters_total.load(), 0); + + t.loader.wait(); +} + TEST(AsyncLoader, TestConcurrency) { AsyncLoaderTest t(10); diff --git a/src/Core/ServerSettings.h b/src/Core/ServerSettings.h index c82255ec59c..129b1016fca 100644 --- a/src/Core/ServerSettings.h +++ b/src/Core/ServerSettings.h @@ -64,6 +64,7 @@ namespace DB M(UInt64, max_concurrent_queries, 0, "Maximum number of concurrently executed queries. Zero means unlimited.", 0) \ M(UInt64, max_concurrent_insert_queries, 0, "Maximum number of concurrently INSERT queries. 
Zero means unlimited.", 0) \ M(UInt64, max_concurrent_select_queries, 0, "Maximum number of concurrently SELECT queries. Zero means unlimited.", 0) \ + M(UInt64, max_waiting_queries, 0, "Maximum number of concurrently waiting queries blocked due to `async_load_databases`. Note that waiting queries are not considered by `max_concurrent_*queries*` limits. Zero means unlimited.", 0) \ \ M(Double, cache_size_to_ram_max_ratio, 0.5, "Set cache size ro RAM max ratio. Allows to lower cache size on low-memory systems.", 0) \ M(String, uncompressed_cache_policy, DEFAULT_UNCOMPRESSED_CACHE_POLICY, "Uncompressed cache policy name.", 0) \ diff --git a/src/Interpreters/ProcessList.cpp b/src/Interpreters/ProcessList.cpp index 3bd7b2d4206..f451d561e60 100644 --- a/src/Interpreters/ProcessList.cpp +++ b/src/Interpreters/ProcessList.cpp @@ -83,25 +83,31 @@ ProcessList::insert(const String & query_, const IAST * ast, ContextMutablePtr q IAST::QueryKind query_kind = ast->getQueryKind(); const auto queue_max_wait_ms = settings.queue_max_wait_ms.totalMilliseconds(); - if (!is_unlimited_query && max_size && processes.size() >= max_size) + UInt64 waiting_queries = waiting_queries_amount.load(); + if (!is_unlimited_query && max_size && processes.size() >= max_size + waiting_queries) { if (queue_max_wait_ms) LOG_WARNING(getLogger("ProcessList"), "Too many simultaneous queries, will wait {} ms.", queue_max_wait_ms); - if (!queue_max_wait_ms || !have_space.wait_for(lock, std::chrono::milliseconds(queue_max_wait_ms), [&]{ return processes.size() < max_size; })) - throw Exception(ErrorCodes::TOO_MANY_SIMULTANEOUS_QUERIES, "Too many simultaneous queries. Maximum: {}", max_size); + if (!queue_max_wait_ms || !have_space.wait_for(lock, std::chrono::milliseconds(queue_max_wait_ms), + [&]{ waiting_queries = waiting_queries_amount.load(); return processes.size() < max_size + waiting_queries; })) + throw Exception(ErrorCodes::TOO_MANY_SIMULTANEOUS_QUERIES, + "Too many simultaneous queries. Maximum: {}{}", + max_size, waiting_queries == 0 ? "" : fmt::format(", waiting: {}", waiting_queries)); } if (!is_unlimited_query) { QueryAmount amount = getQueryKindAmount(query_kind); - if (max_insert_queries_amount && query_kind == IAST::QueryKind::Insert && amount >= max_insert_queries_amount) + UInt64 waiting_inserts = waiting_insert_queries_amount.load(); + UInt64 waiting_selects = waiting_select_queries_amount.load(); + if (max_insert_queries_amount && query_kind == IAST::QueryKind::Insert && amount >= max_insert_queries_amount + waiting_inserts) throw Exception(ErrorCodes::TOO_MANY_SIMULTANEOUS_QUERIES, - "Too many simultaneous insert queries. Maximum: {}, current: {}", - max_insert_queries_amount, amount); - if (max_select_queries_amount && query_kind == IAST::QueryKind::Select && amount >= max_select_queries_amount) + "Too many simultaneous insert queries. Maximum: {}, current: {}{}", + max_insert_queries_amount, amount, waiting_inserts == 0 ? "" : fmt::format(", waiting: {}", waiting_inserts)); + if (max_select_queries_amount && query_kind == IAST::QueryKind::Select && amount >= max_select_queries_amount + waiting_selects) throw Exception(ErrorCodes::TOO_MANY_SIMULTANEOUS_QUERIES, - "Too many simultaneous select queries. Maximum: {}, current: {}", - max_select_queries_amount, amount); + "Too many simultaneous select queries. Maximum: {}, current: {}{}", + max_select_queries_amount, amount, waiting_selects == 0 ? 
"" : fmt::format(", waiting: {}", waiting_selects)); } { @@ -124,10 +130,12 @@ ProcessList::insert(const String & query_, const IAST * ast, ContextMutablePtr q * once is already processing 50+ concurrent queries (including analysts or any other users). */ + waiting_queries = waiting_queries_amount.load(); if (!is_unlimited_query && settings.max_concurrent_queries_for_all_users - && processes.size() >= settings.max_concurrent_queries_for_all_users) + && processes.size() >= settings.max_concurrent_queries_for_all_users + waiting_queries_amount) throw Exception(ErrorCodes::TOO_MANY_SIMULTANEOUS_QUERIES, "Too many simultaneous queries for all users. " - "Current: {}, maximum: {}", processes.size(), settings.max_concurrent_queries_for_all_users.toString()); + "Current: {}, maximum: {}{}", processes.size(), settings.max_concurrent_queries_for_all_users.toString(), + waiting_queries == 0 ? "" : fmt::format(", waiting: {}", waiting_queries)); } /** Why we use current user? @@ -145,13 +153,15 @@ ProcessList::insert(const String & query_, const IAST * ast, ContextMutablePtr q if (user_process_list != user_to_queries.end()) { + UInt64 user_waiting_queries = user_process_list->second.waiting_queries_amount.load(); if (!is_unlimited_query && settings.max_concurrent_queries_for_user - && user_process_list->second.queries.size() >= settings.max_concurrent_queries_for_user) + && user_process_list->second.queries.size() >= settings.max_concurrent_queries_for_user + user_waiting_queries) throw Exception(ErrorCodes::TOO_MANY_SIMULTANEOUS_QUERIES, "Too many simultaneous queries for user {}. " - "Current: {}, maximum: {}", + "Current: {}, maximum: {}{}", client_info.current_user, user_process_list->second.queries.size(), - settings.max_concurrent_queries_for_user.toString()); + settings.max_concurrent_queries_for_user.toString(), + user_waiting_queries == 0 ? "" : fmt::format(", waiting: {}", user_waiting_queries)); auto running_query = user_process_list->second.queries.find(client_info.current_query_id); @@ -745,4 +755,69 @@ ProcessList::QueryAmount ProcessList::getQueryKindAmount(const IAST::QueryKind & return found->second; } +void ProcessList::increaseWaitingQueryAmount(const QueryStatusPtr & status) +{ + UInt64 limit = max_waiting_queries_amount.load(); + UInt64 value = waiting_queries_amount.load(); + while (true) + { + if (value >= limit) + throw Exception(ErrorCodes::TOO_MANY_SIMULTANEOUS_QUERIES, + "Too many simultaneous waiting queries. Maximum: {}, waiting: {}", + limit, value); + if (waiting_queries_amount.compare_exchange_strong(value, value + 1)) + break; + } + + // WARNING: After this point we should not throw, otherwise corresponding `decreaseWaitingQueryAmount` will not be called. 
+ + // Update query kind counters + if (status->query_kind == IAST::QueryKind::Insert) + waiting_insert_queries_amount.fetch_add(1); + if (status->query_kind == IAST::QueryKind::Select) + waiting_select_queries_amount.fetch_add(1); + + // Update per-user counter + status->getUserProcessList()->waiting_queries_amount.fetch_add(1); + + // We have to notify because some queries might be waiting on `have_space` + // and this query leaves its space by transitioning to waiting state + have_space.notify_all(); +} + +void ProcessList::decreaseWaitingQueryAmount(const QueryStatusPtr & status) +{ + if (status->getUserProcessList()->waiting_queries_amount.fetch_sub(1) == 0) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Wrong insert waiting query amount for user: decrease to negative"); + + if (status->query_kind == IAST::QueryKind::Insert && waiting_insert_queries_amount.fetch_sub(1) == 0) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Wrong insert waiting query amount: decrease to negative"); + + if (status->query_kind == IAST::QueryKind::Select && waiting_select_queries_amount.fetch_sub(1) == 0) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Wrong select waiting query amount: decrease to negative"); + + if (waiting_queries_amount.fetch_sub(1) == 0) + throw Exception(ErrorCodes::LOGICAL_ERROR, "Wrong waiting query amount: decrease to negative"); +} + +void ProcessList::incrementWaiters() +{ + ContextPtr context = CurrentThread::getQueryContext(); + QueryStatusPtr status = context->getProcessListElement(); + + // Query became "waiting" with the first thread that waits + if (status->waiting_threads.fetch_add(1) == 0) + increaseWaitingQueryAmount(status); +} + +void ProcessList::decrementWaiters() +{ + ContextPtr context = CurrentThread::getQueryContext(); + QueryStatusPtr status = context->getProcessListElement(); + + // Query became "non-waiting" with the last thread that no longer waits + if (status->waiting_threads.fetch_sub(1) == 1) + decreaseWaitingQueryAmount(status); +} + } diff --git a/src/Interpreters/ProcessList.h b/src/Interpreters/ProcessList.h index 1c253f562e8..75350627698 100644 --- a/src/Interpreters/ProcessList.h +++ b/src/Interpreters/ProcessList.h @@ -42,10 +42,6 @@ class ThreadStatus; class ProcessListEntry; -/** List of currently executing queries. - * Also implements limit on their number. - */ - /** Information of process list element. * To output in SHOW PROCESSLIST query. Does not contain any complex objects, that do something on copy or destructor. */ @@ -114,8 +110,13 @@ protected: /// Including EndOfStream or Exception. std::atomic is_all_data_sent { false }; + /// Number of threads for the query that are waiting for load jobs + std::atomic waiting_threads{0}; + + /// For initialization of ProcessListForUser during process insertion. void setUserProcessList(ProcessListForUser * user_process_list_); /// Be careful using it. For example, queries field of ProcessListForUser could be modified concurrently. + ProcessListForUser * getUserProcessList() { return user_process_list; } const ProcessListForUser * getUserProcessList() const { return user_process_list; } /// Sets an entry in the ProcessList associated with this QueryStatus. @@ -283,6 +284,9 @@ struct ProcessListForUser /// Count network usage for all simultaneously running queries of single user. ThrottlerPtr user_throttler; + /// Number of queries waiting on load jobs + std::atomic waiting_queries_amount{0}; + ProcessListForUserInfo getInfo(bool get_profile_events = false) const; /// Clears MemoryTracker for the user. 
@@ -341,6 +345,9 @@ protected: }; +/** List of currently executing queries. + * Also implements limit on their number. + */ class ProcessList : public ProcessListBase { public: @@ -399,10 +406,21 @@ protected: /// amount of queries by query kind. QueryKindAmounts query_kind_amounts; + /// limit for waiting queries. 0 means no limit. Otherwise, when limit exceeded, an exception is thrown. + std::atomic max_waiting_queries_amount{0}; + + /// amounts of waiting queries + std::atomic waiting_queries_amount{0}; + std::atomic waiting_insert_queries_amount{0}; + std::atomic waiting_select_queries_amount{0}; + void increaseQueryKindAmount(const IAST::QueryKind & query_kind); void decreaseQueryKindAmount(const IAST::QueryKind & query_kind); QueryAmount getQueryKindAmount(const IAST::QueryKind & query_kind) const; + void increaseWaitingQueryAmount(const QueryStatusPtr & status); + void decreaseWaitingQueryAmount(const QueryStatusPtr & status); + public: using EntryPtr = std::shared_ptr; @@ -458,6 +476,21 @@ public: return max_select_queries_amount; } + void setMaxWaitingQueriesAmount(UInt64 max_waiting_queries_amount_) + { + max_waiting_queries_amount.store(max_waiting_queries_amount_); + // NOTE: We cannot cancel waiting queries when limit is lowered. They have to wait anyways, but new queries will be canceled instead of waiting. + } + + size_t getMaxWaitingQueriesAmount() const + { + return max_waiting_queries_amount.load(); + } + + // Handlers for AsyncLoader waiters + void incrementWaiters(); + void decrementWaiters(); + /// Try call cancel() for input and output streams of query with specified id and user CancellationCode sendCancelToQuery(const String & current_query_id, const String & current_user, bool kill = false); CancellationCode sendCancelToQuery(QueryStatusPtr elem, bool kill = false); diff --git a/src/Storages/System/StorageSystemServerSettings.cpp b/src/Storages/System/StorageSystemServerSettings.cpp index f390985546b..bf14f757a19 100644 --- a/src/Storages/System/StorageSystemServerSettings.cpp +++ b/src/Storages/System/StorageSystemServerSettings.cpp @@ -70,6 +70,7 @@ void StorageSystemServerSettings::fillData(MutableColumns & res_columns, Context {"max_concurrent_queries", {std::to_string(context->getProcessList().getMaxSize()), ChangeableWithoutRestart::Yes}}, {"max_concurrent_insert_queries", {std::to_string(context->getProcessList().getMaxInsertQueriesAmount()), ChangeableWithoutRestart::Yes}}, {"max_concurrent_select_queries", {std::to_string(context->getProcessList().getMaxSelectQueriesAmount()), ChangeableWithoutRestart::Yes}}, + {"max_waiting_queries", {std::to_string(context->getProcessList().getMaxWaitingQueriesAmount()), ChangeableWithoutRestart::Yes}}, {"background_buffer_flush_schedule_pool_size", {std::to_string(CurrentMetrics::get(CurrentMetrics::BackgroundBufferFlushSchedulePoolSize)), ChangeableWithoutRestart::IncreaseOnly}}, {"background_schedule_pool_size", {std::to_string(CurrentMetrics::get(CurrentMetrics::BackgroundSchedulePoolSize)), ChangeableWithoutRestart::IncreaseOnly}}, From f4fc65449cc3ace36f33323600fd1a47fbfb9736 Mon Sep 17 00:00:00 2001 From: Peter Date: Fri, 8 Mar 2024 01:20:50 +0800 Subject: [PATCH 165/985] Add another example dataset for presenting usage --- .../example-datasets/tw-weather.md | 293 ++++++++++++++++++ 1 file changed, 293 insertions(+) create mode 100644 docs/en/getting-started/example-datasets/tw-weather.md diff --git a/docs/en/getting-started/example-datasets/tw-weather.md b/docs/en/getting-started/example-datasets/tw-weather.md new 
file mode 100644
index 00000000000..e5f16c403d5
--- /dev/null
+++ b/docs/en/getting-started/example-datasets/tw-weather.md
@@ -0,0 +1,293 @@
+---
+slug: /en/getting-started/example-datasets/tw-weather
+sidebar_label: Taiwan Historical Weather Datasets
+sidebar_position: 1
+description: 131 million rows of weather observation data for the last 128 years
+---
+
+# Taiwan Historical Weather Datasets
+
+This dataset contains historical meteorological observations for the last 128 years. Each row is a measurement for a weather station at a point in time.
+
+The origin of this dataset is available [here](https://github.com/Raingel/historical_weather) and the list of weather station numbers can be found [here](https://github.com/Raingel/weather_station_list).
+
+> The sources of the meteorological datasets include the meteorological stations established by the Central Weather Administration (station codes beginning with C0, C1, and 4) and the agricultural meteorological stations belonging to the Council of Agriculture (station codes other than those mentioned above):
+
+ - StationId
+ - MeasuredDate, the observation time
+ - StnPres, the station air pressure
+ - SeaPres, the sea level pressure
+ - Td, the dew point temperature
+ - RH, the relative humidity
+ - Other elements where available
+
+## Downloading the data
+
+- A [pre-processed version](#pre-processed-data) of the data for ClickHouse, which has been cleaned, re-structured, and enriched. This dataset covers the years from 1896 to 2023.
+- [Download the original raw data](#original-raw-data) and convert it to the format required by ClickHouse. Users who want to add their own columns may wish to explore or extend this approach.
+
+### Pre-processed data
+
+The dataset has also been re-structured from one measurement per line to one row per weather station id and measured date, i.e.
+
+```csv
+StationId,MeasuredDate,StnPres,Tx,RH,WS,WD,WSGust,WDGust,Precp,GloblRad,TxSoil0cm,TxSoil5cm,TxSoil20cm,TxSoil50cm,TxSoil100cm,SeaPres,Td,PrecpHour,SunShine,TxSoil10cm,EvapA,Visb,UVI,Cloud Amount,TxSoil30cm,TxSoil200cm,TxSoil300cm,TxSoil500cm,VaporPressure
+C0X100,2016-01-01 01:00:00,1022.1,16.1,72,1.1,8.0,,,,,,,,,,,,,,,,,,,,,,,
+C0X100,2016-01-01 02:00:00,1021.6,16.0,73,1.2,358.0,,,,,,,,,,,,,,,,,,,,,,,
+C0X100,2016-01-01 03:00:00,1021.3,15.8,74,1.5,353.0,,,,,,,,,,,,,,,,,,,,,,,
+C0X100,2016-01-01 04:00:00,1021.2,15.8,74,1.7,8.0,,,,,,,,,,,,,,,,,,,,,,,
+```
+
+This makes the data easier to query and keeps the resulting table less sparse; some elements are null because they are not available to be measured at that weather station.
+
+This dataset is available in the following Google Cloud Storage location. Either download the dataset to your local filesystem (and insert it with the ClickHouse client) or insert it directly into ClickHouse (see [Inserting from URL](#inserting-from-url)).
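+
+For example, before downloading anything you can optionally let ClickHouse infer the schema of the hosted CSV. This is only a quick sanity-check sketch; it uses the same URL as the [Inserting from URL](#inserting-from-url) section below and assumes that URL is reachable from your server:
+
+```sql
+-- Optional sanity check (assumes the hosted CSV is reachable from the server)
+DESCRIBE TABLE url('https://storage.googleapis.com/taiwan-weather-observaiton-datasets/daily_weather_preprocessed_1896_2023.csv', 'CSVWithNames');
+```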
+
+To download:
+
+```bash
+wget https://storage.googleapis.com/taiwan-weather-observaiton-datasets/preprocessed_weather_daily_1896_2023.tar.gz
+
+# Option: Validate the checksum
+md5sum preprocessed_weather_daily_1896_2023.tar.gz
+# Checksum should be equal to: 11b484f5bd9ddafec5cfb131eb2dd008
+
+tar -xzvf preprocessed_weather_daily_1896_2023.tar.gz
+daily_weather_preprocessed_1896_2023.csv
+
+# Option: Validate the checksum
+md5sum daily_weather_preprocessed_1896_2023.csv
+# Checksum should be equal to: 1132248c78195c43d93f843753881754
+```
+
+### Original raw data
+
+The following section describes how to download the original raw data so that you can transform and convert it as you want.
+
+#### Download
+
+To download the original raw data:
+
+```bash
+mkdir tw_raw_weather_data && cd tw_raw_weather_data
+
+wget https://storage.googleapis.com/taiwan-weather-observaiton-datasets/raw_data_weather_daily_1896_2023.tar.gz
+
+# Option: Validate the checksum
+md5sum raw_data_weather_daily_1896_2023.tar.gz
+# Checksum should be equal to: b66b9f137217454d655e3004d7d1b51a
+
+tar -xzvf raw_data_weather_daily_1896_2023.tar.gz
+466920_1928.csv
+466920_1929.csv
+466920_1930.csv
+466920_1931.csv
+...
+
+# Option: Validate the checksum
+cat *.csv | md5sum
+# Checksum should be equal to: b26db404bf84d4063fac42e576464ce1
+```
+
+#### Retrieve the Taiwan weather stations
+
+```bash
+wget -O weather_sta_list.csv https://github.com/Raingel/weather_station_list/raw/main/data/weather_sta_list.csv
+
+# Option: Convert the UTF-8-BOM to UTF-8 encoding
+sed -i '1s/^\xEF\xBB\xBF//' weather_sta_list.csv
+```
+
+## Create table schema
+
+Create the MergeTree table in ClickHouse (from the ClickHouse client).
+
+```sql
+CREATE TABLE tw_weather_data (
+    StationId String null,
+    MeasuredDate DateTime64,
+    StnPres Float64 null,
+    SeaPres Float64 null,
+    Tx Float64 null,
+    Td Float64 null,
+    RH Float64 null,
+    WS Float64 null,
+    WD Float64 null,
+    WSGust Float64 null,
+    WDGust Float64 null,
+    Precp Float64 null,
+    PrecpHour Float64 null,
+    SunShine Float64 null,
+    GloblRad Float64 null,
+    TxSoil0cm Float64 null,
+    TxSoil5cm Float64 null,
+    TxSoil10cm Float64 null,
+    TxSoil20cm Float64 null,
+    TxSoil50cm Float64 null,
+    TxSoil100cm Float64 null,
+    TxSoil30cm Float64 null,
+    TxSoil200cm Float64 null,
+    TxSoil300cm Float64 null,
+    TxSoil500cm Float64 null,
+    VaporPressure Float64 null,
+    UVI Float64 null,
+    "Cloud Amount" Float64 null,
+    EvapA Float64 null,
+    Visb Float64 null
+)
+ENGINE = MergeTree
+ORDER BY (MeasuredDate);
+```
+
+## Inserting into ClickHouse
+
+### Inserting from local file
+
+Data can be inserted from a local file as follows (from the ClickHouse client):
+
+```sql
+INSERT INTO tw_weather_data FROM INFILE '/path/to/daily_weather_preprocessed_1896_2023.csv'
+```
+
+where `/path/to` represents the path to the local file on disk.
+
+The sample response output after inserting the data into ClickHouse is as follows:
+
+```response
+Query id: 90e4b524-6e14-4855-817c-7e6f98fbeabb
+
+Ok.
+131985329 rows in set. Elapsed: 71.770 sec. Processed 131.99 million rows, 10.06 GB (1.84 million rows/s., 140.14 MB/s.)
+Peak memory usage: 583.23 MiB.
+``` + +### Inserting from URL + +```sql +INSERT INTO tw_weather_data SELECT * +FROM url('https://storage.googleapis.com/taiwan-weather-observaiton-datasets/daily_weather_preprocessed_1896_2023.csv', 'CSVWithNames') + +``` +To know how to speed this up, please see our blog post on [tuning large data loads](https://clickhouse.com/blog/supercharge-your-clickhouse-data-loads-part2). + +## Check data rows and sizes + +1. Let's see how many rows are inserted: + +```sql +SELECT formatReadableQuantity(count()) +FROM tw_weather_data; +``` + +```response +┌─formatReadableQuantity(count())─┐ +│ 131.99 million │ +└─────────────────────────────────┘ +``` + +2. Let's see how much disk space are used for this table: + +```sql +SELECT + formatReadableSize(sum(bytes)) AS disk_size, + formatReadableSize(sum(data_uncompressed_bytes)) AS uncompressed_size +FROM system.parts +WHERE (`table` = 'tw_weather_data') AND active +``` + +```response +┌─disk_size─┬─uncompressed_size─┐ +│ 2.13 GiB │ 32.94 GiB │ +└───────────┴───────────────────┘ +``` + +## Sample queries + +### Q1: Retrieve the highest dew point temperature for each weather station in the specific year + +```sql +SELECT + StationId, + max(Td) AS max_td +FROM tw_weather_data +WHERE (year(MeasuredDate) = 2023) AND (Td IS NOT NULL) +GROUP BY StationId + +┌─StationId─┬─max_td─┐ +│ 466940 │ 1 │ +│ 467300 │ 1 │ +│ 467540 │ 1 │ +│ 467490 │ 1 │ +│ 467080 │ 1 │ +│ 466910 │ 1 │ +│ 467660 │ 1 │ +│ 467270 │ 1 │ +│ 467350 │ 1 │ +│ 467571 │ 1 │ +│ 466920 │ 1 │ +│ 467650 │ 1 │ +│ 467550 │ 1 │ +│ 467480 │ 1 │ +│ 467610 │ 1 │ +│ 467050 │ 1 │ +│ 467590 │ 1 │ +│ 466990 │ 1 │ +│ 467060 │ 1 │ +│ 466950 │ 1 │ +│ 467620 │ 1 │ +│ 467990 │ 1 │ +│ 466930 │ 1 │ +│ 467110 │ 1 │ +│ 466881 │ 1 │ +│ 467410 │ 1 │ +│ 467441 │ 1 │ +│ 467420 │ 1 │ +│ 467530 │ 1 │ +│ 466900 │ 1 │ +└───────────┴────────┘ + +30 rows in set. Elapsed: 0.045 sec. Processed 6.41 million rows, 187.33 MB (143.92 million rows/s., 4.21 GB/s.) +``` + +### Q2: Raw data fetching with the specific duration time range, fields and weather station + +```sql +SELECT + StnPres, + SeaPres, + Tx, + Td, + RH, + WS, + WD, + WSGust, + WDGust, + Precp, + PrecpHour +FROM tw_weather_data +WHERE (StationId = 'C0UB10') AND (MeasuredDate >= '2023-12-23') AND (MeasuredDate < '2023-12-24') +ORDER BY MeasuredDate ASC +LIMIT 10 +``` + +```response +┌─StnPres─┬─SeaPres─┬───Tx─┬───Td─┬─RH─┬──WS─┬──WD─┬─WSGust─┬─WDGust─┬─Precp─┬─PrecpHour─┐ +│ 1029.5 │ ᴺᵁᴸᴸ │ 11.8 │ ᴺᵁᴸᴸ │ 78 │ 2.7 │ 271 │ 5.5 │ 275 │ -99.8 │ -99.8 │ +│ 1029.8 │ ᴺᵁᴸᴸ │ 12.3 │ ᴺᵁᴸᴸ │ 78 │ 2.7 │ 289 │ 5.5 │ 308 │ -99.8 │ -99.8 │ +│ 1028.6 │ ᴺᵁᴸᴸ │ 12.3 │ ᴺᵁᴸᴸ │ 79 │ 2.3 │ 251 │ 6.1 │ 289 │ -99.8 │ -99.8 │ +│ 1028.2 │ ᴺᵁᴸᴸ │ 13 │ ᴺᵁᴸᴸ │ 75 │ 4.3 │ 312 │ 7.5 │ 316 │ -99.8 │ -99.8 │ +│ 1027.8 │ ᴺᵁᴸᴸ │ 11.1 │ ᴺᵁᴸᴸ │ 89 │ 7.1 │ 310 │ 11.6 │ 322 │ -99.8 │ -99.8 │ +│ 1027.8 │ ᴺᵁᴸᴸ │ 11.6 │ ᴺᵁᴸᴸ │ 90 │ 3.1 │ 269 │ 10.7 │ 295 │ -99.8 │ -99.8 │ +│ 1027.9 │ ᴺᵁᴸᴸ │ 12.3 │ ᴺᵁᴸᴸ │ 89 │ 4.7 │ 296 │ 8.1 │ 310 │ -99.8 │ -99.8 │ +│ 1028.2 │ ᴺᵁᴸᴸ │ 12.2 │ ᴺᵁᴸᴸ │ 94 │ 2.5 │ 246 │ 7.1 │ 283 │ -99.8 │ -99.8 │ +│ 1028.4 │ ᴺᵁᴸᴸ │ 12.5 │ ᴺᵁᴸᴸ │ 94 │ 3.1 │ 265 │ 4.8 │ 297 │ -99.8 │ -99.8 │ +│ 1028.3 │ ᴺᵁᴸᴸ │ 13.6 │ ᴺᵁᴸᴸ │ 91 │ 1.2 │ 273 │ 4.4 │ 256 │ -99.8 │ -99.8 │ +└─────────┴─────────┴──────┴──────┴────┴─────┴─────┴────────┴────────┴───────┴───────────┘ + +10 rows in set. Elapsed: 0.009 sec. Processed 91.70 thousand rows, 2.33 MB (9.67 million rows/s., 245.31 MB/s.) 
+``` + +## Credits + +We would like to acknowledge the efforts of the Central Weather Administration and Agricultural Meteorological Observation Network (Station) of the Council of Agriculture for preparing, cleaning, and distributing this dataset. We appreciate your efforts. + +Ou, J.-H., Kuo, C.-H., Wu, Y.-F., Lin, G.-C., Lee, M.-H., Chen, R.-K., Chou, H.-P., Wu, H.-Y., Chu, S.-C., Lai, Q.-J., Tsai, Y.-C., Lin, C.-C., Kuo, C.-C., Liao, C.-T., Chen, Y.-N., Chu, Y.-W., Chen, C.-Y., 2023. Application-oriented deep learning model for early warning of rice blast in Taiwan. Ecological Informatics 73, 101950. https://doi.org/10.1016/j.ecoinf.2022.101950 [13/12/2022] From a2bdb054ca5a9c205f5d0442313d3c9f4d22cda7 Mon Sep 17 00:00:00 2001 From: Igor Nikonov Date: Thu, 7 Mar 2024 17:31:37 +0000 Subject: [PATCH 166/985] Cleanup --- src/Interpreters/InterpreterSelectQuery.cpp | 4 +--- .../queries/0_stateless/03006_parallel_replicas_prewhere.sql | 4 +++- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/src/Interpreters/InterpreterSelectQuery.cpp b/src/Interpreters/InterpreterSelectQuery.cpp index 80e2d5afef7..987bf560add 100644 --- a/src/Interpreters/InterpreterSelectQuery.cpp +++ b/src/Interpreters/InterpreterSelectQuery.cpp @@ -2111,8 +2111,7 @@ void InterpreterSelectQuery::applyFiltersToPrewhereInAnalysis(ExpressionAnalysis if (does_storage_support_prewhere && shouldMoveToPrewhere()) { /// Execute row level filter in prewhere as a part of "move to prewhere" optimization. - analysis.prewhere_info - = std::make_shared(analysis.filter_info->actions, analysis.filter_info->column_name); + analysis.prewhere_info = std::make_shared(analysis.filter_info->actions, analysis.filter_info->column_name); analysis.prewhere_info->prewhere_actions->projectInput(false); analysis.prewhere_info->remove_prewhere_column = analysis.filter_info->do_remove_column; analysis.prewhere_info->need_filter = true; @@ -2121,7 +2120,6 @@ void InterpreterSelectQuery::applyFiltersToPrewhereInAnalysis(ExpressionAnalysis } else { - chassert(analysis.filter_info->actions); /// Add row level security actions to prewhere. 
analysis.prewhere_info->row_level_filter = analysis.filter_info->actions; analysis.prewhere_info->row_level_column_name = std::move(analysis.filter_info->column_name); diff --git a/tests/queries/0_stateless/03006_parallel_replicas_prewhere.sql b/tests/queries/0_stateless/03006_parallel_replicas_prewhere.sql index 819526b5596..4b84646c034 100644 --- a/tests/queries/0_stateless/03006_parallel_replicas_prewhere.sql +++ b/tests/queries/0_stateless/03006_parallel_replicas_prewhere.sql @@ -25,5 +25,7 @@ EXPLAIN ESTIMATE SELECT count() FROM url_na_log PREWHERE (DateVisit >= toFixedString('2022-08-10', 10)) AND (DateVisit <= '2022-08-20') -SETTINGS max_block_size = 1048576, max_threads = 1, allow_experimental_parallel_reading_from_replicas = 1, parallel_replicas_for_non_replicated_merge_tree = 1, cluster_for_parallel_replicas = 'test_cluster_one_shard_three_replicas_localhost', max_parallel_replicas = 3, allow_experimental_analyzer=0, parallel_replicas_min_number_of_rows_per_replica=10000; +SETTINGS max_block_size = 1048576, max_threads = 1, allow_experimental_parallel_reading_from_replicas = 1, parallel_replicas_for_non_replicated_merge_tree = 1, cluster_for_parallel_replicas = 'test_cluster_one_shard_three_replicas_localhost', max_parallel_replicas = 3, parallel_replicas_min_number_of_rows_per_replica=10000; +DROP POLICY url_na_log_policy0 ON url_na_log; +DROP TABLE url_na_log; From 38cbc2c6c40541cc916bc591cd68b7eef70b1162 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Ra=C3=BAl=20Mar=C3=ADn?= Date: Thu, 7 Mar 2024 18:57:16 +0100 Subject: [PATCH 167/985] Restore digits --- base/base/itoa.cpp | 43 +++++++++++++++++++------------------------ 1 file changed, 19 insertions(+), 24 deletions(-) diff --git a/base/base/itoa.cpp b/base/base/itoa.cpp index 9fefc9f0f07..ef844ff68a8 100644 --- a/base/base/itoa.cpp +++ b/base/base/itoa.cpp @@ -34,42 +34,37 @@ template -int digits10(T x) +inline int digits10(T x) { - if (x < T(10ULL)) + if (x < 10ULL) return 1; - if (x < T(100ULL)) + if (x < 100ULL) return 2; - if constexpr (sizeof(T) == 1) + if (x < 1000ULL) return 3; - else + + if (x < 1000000000000ULL) { - if (x < T(1000ULL)) - return 3; - - if (x < T(1000000000000ULL)) + if (x < 100000000ULL) { - if (x < T(100000000ULL)) + if (x < 1000000ULL) { - if (x < T(1000000ULL)) - { - if (x < T(10000ULL)) - return 4; - else - return 5 + (x >= T(100000ULL)); - } - - return 7 + (x >= T(10000000ULL)); + if (x < 10000ULL) + return 4; + else + return 5 + (x >= 100000ULL); } - if (x < T(10000000000ULL)) - return 9 + (x >= T(1000000000ULL)); - - return 11 + (x >= T(100000000000ULL)); + return 7 + (x >= 10000000ULL); } - return 12 + digits10(x / T(1000000000000ULL)); + if (x < 10000000000ULL) + return 9 + (x >= 1000000000ULL); + + return 11 + (x >= 100000000000ULL); } + + return 12 + digits10(x / 1000000000000ULL); } From a00a1fd7b4c9a4e83eeb746da781b27c74dcd0b2 Mon Sep 17 00:00:00 2001 From: johnnymatthews <9611008+johnnymatthews@users.noreply.github.com> Date: Thu, 7 Mar 2024 14:45:15 -0400 Subject: [PATCH 168/985] Adds readWKT docs. 
--- .../en/sql-reference/functions/geo/polygon.md | 56 +++++++++++++++++++ 1 file changed, 56 insertions(+) diff --git a/docs/en/sql-reference/functions/geo/polygon.md b/docs/en/sql-reference/functions/geo/polygon.md index 4a8653965c2..35e2280e5cc 100644 --- a/docs/en/sql-reference/functions/geo/polygon.md +++ b/docs/en/sql-reference/functions/geo/polygon.md @@ -53,6 +53,62 @@ String starting with `POLYGON` Polygon +## readWKTPoint + +The `readWKTPoint` function in ClickHouse parses a Well-Known Text (WKT) representation of a Point geometry and returns a point in the internal ClickHouse format. + +### Syntax + +```sql +readWKTPoint(wkt_string) +``` + +### Arguments + +- `wkt_string`: The input WKT string representing a Point geometry. + +### Returned value + +The function returns a ClickHouse internal representation of the Point geometry. + +### Example + +```sql +SELECT readWKTPoint('POINT (1.2 3.4)'); +``` + +```response +(1.2,3.4) +``` + +## readWKTRing + +Parses a Well-Known Text (WKT) representation of a Polygon geometry and returns a ring (closed linestring) in the internal ClickHouse format. + +### Syntax + +```sql +readWKTRing(wkt_string) +``` + +### Arguments + +- `wkt_string`: The input WKT string representing a Polygon geometry. + +### Returned value + +The function returns a ClickHouse internal representation of the ring (closed linestring) geometry. + +### Example + +```sql +SELECT readWKTRing('LINESTRING (1 1, 2 2, 3 3, 1 1)'); +``` + +```response +[(1,1),(2,2),(3,3),(1,1)] +``` + ## polygonsWithinSpherical Returns true or false depending on whether or not one polygon lies completely inside another polygon. Reference https://www.boost.org/doc/libs/1_62_0/libs/geometry/doc/html/geometry/reference/algorithms/within/within_2.html From 444595ac576438c9d0a259debf776187ddd3fcce Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Ra=C3=BAl=20Mar=C3=ADn?= Date: Thu, 7 Mar 2024 20:00:07 +0100 Subject: [PATCH 169/985] More speed please Mr. compiler --- base/base/itoa.cpp | 165 +++++++++++++++++++++++++++++++-------------- 1 file changed, 114 insertions(+), 51 deletions(-) diff --git a/base/base/itoa.cpp b/base/base/itoa.cpp index ef844ff68a8..08912edf3ea 100644 --- a/base/base/itoa.cpp +++ b/base/base/itoa.cpp @@ -72,7 +72,7 @@ namespace { template -static constexpr T pow10(size_t x) +ALWAYS_INLINE inline constexpr T pow10(size_t x) { return x ? 
10 * pow10(x - 1) : 1; } @@ -143,7 +143,7 @@ struct QuotientAndRemainder }; template -QuotientAndRemainder static inline split(UnsignedOfSize value) +QuotientAndRemainder inline split(UnsignedOfSize value) { constexpr DivisionBy10PowN division; @@ -154,7 +154,7 @@ QuotientAndRemainder static inline split(UnsignedOfSize value) } -static inline char * outDigit(char * p, uint8_t value) +ALWAYS_INLINE inline char * outDigit(char * p, uint8_t value) { *p = '0' + value; ++p; @@ -176,7 +176,7 @@ static const char digits[201] = "00010203040506070809" "80818283848586878889" "90919293949596979899"; -static inline char * outTwoDigits(char * p, uint8_t value) +ALWAYS_INLINE inline char * outTwoDigits(char * p, uint8_t value) { memcpy(p, &digits[value * 2], 2); p += 2; @@ -187,9 +187,9 @@ static inline char * outTwoDigits(char * p, uint8_t value) namespace convert { template -static char * head(char * p, UInt u); +char * head(char * p, UInt u); template -static char * tail(char * p, UInt u); +char * tail(char * p, UInt u); //===----------------------------------------------------------===// // head: find most significant digit, skip leading zeros @@ -198,7 +198,7 @@ static char * tail(char * p, UInt u); // "x" contains quotient and remainder after division by 10^N // quotient is less than 10^N template -static inline char * head(char * p, QuotientAndRemainder x) +ALWAYS_INLINE inline char * head(char * p, QuotientAndRemainder x) { p = head(p, UnsignedOfSize(x.quotient)); p = tail(p, x.remainder); @@ -207,14 +207,14 @@ static inline char * head(char * p, QuotientAndRemainder x) // "u" is less than 10^2*N template -static inline char * head(char * p, UInt u) +ALWAYS_INLINE inline char * head(char * p, UInt u) { return u < pow10>(N) ? head(p, UnsignedOfSize(u)) : head(p, split(u)); } // recursion base case, selected when "u" is one byte template <> -inline char * head, 1>(char * p, UnsignedOfSize<1> u) +ALWAYS_INLINE inline char * head, 1>(char * p, UnsignedOfSize<1> u) { return u < 10 ? 
outDigit(p, u) : outTwoDigits(p, u); } @@ -225,7 +225,7 @@ inline char * head, 1>(char * p, UnsignedOfSize<1> u) // recursive step, "u" is less than 10^2*N template -static inline char * tail(char * p, UInt u) +ALWAYS_INLINE inline char * tail(char * p, UInt u) { QuotientAndRemainder x = split(u); p = tail(p, UnsignedOfSize(x.quotient)); @@ -235,7 +235,7 @@ static inline char * tail(char * p, UInt u) // recursion base case, selected when "u" is one byte template <> -inline char * tail, 1>(char * p, UnsignedOfSize<1> u) +ALWAYS_INLINE inline char * tail, 1>(char * p, UnsignedOfSize<1> u) { return outTwoDigits(p, u); } @@ -244,9 +244,8 @@ inline char * tail, 1>(char * p, UnsignedOfSize<1> u) // large values are >= 10^2*N // where x contains quotient and remainder after division by 10^N //===----------------------------------------------------------===// - template -static inline char * large(char * p, QuotientAndRemainder x) +ALWAYS_INLINE inline char * large(char * p, QuotientAndRemainder x) { QuotientAndRemainder y = split(x.quotient); p = head(p, UnsignedOfSize(y.quotient)); @@ -259,9 +258,8 @@ static inline char * large(char * p, QuotientAndRemainder x) // handle values of "u" that might be >= 10^2*N // where N is the size of "u" in bytes //===----------------------------------------------------------===// - template -static inline char * uitoa(char * p, UInt u) +ALWAYS_INLINE inline char * uitoa(char * p, UInt u) { if (u < pow10>(N)) return head(p, UnsignedOfSize(u)); @@ -272,7 +270,7 @@ static inline char * uitoa(char * p, UInt u) // selected when "u" is one byte template <> -inline char * uitoa, 1>(char * p, UnsignedOfSize<1> u) +ALWAYS_INLINE inline char * uitoa, 1>(char * p, UnsignedOfSize<1> u) { if (u < 10) return outDigit(p, u); @@ -292,14 +290,14 @@ inline char * uitoa, 1>(char * p, UnsignedOfSize<1> u) // itoa: handle unsigned integral operands (selected by SFINAE) template && std::is_integral_v> * = nullptr> -static inline char * itoa(U u, char * p) +ALWAYS_INLINE inline char * itoa(U u, char * p) { return convert::uitoa(p, u); } // itoa: handle signed integral operands (selected by SFINAE) template && std::is_integral_v> * = nullptr> -static inline char * itoa(I i, char * p) +ALWAYS_INLINE inline char * itoa(I i, char * p) { // Need "mask" to be filled with a copy of the sign bit. 
// If "i" is a negative value, then the result of "operator >>" @@ -335,63 +333,128 @@ static inline char * itoa(I i, char * p) } -template -static NO_INLINE char * writeUIntText(T _x, char * p) +const uint64_t max_multiple_of_hundred_that_fits_in_64_bits = 1'00'00'00'00'00'00'00'00'00ull; +constexpr int max_multiple_of_hundred_blocks = 9; +static_assert(max_multiple_of_hundred_that_fits_in_64_bits % 100 == 0); + +ALWAYS_INLINE inline char * writeUIntText(UInt128 _x, char * p) { - static_assert(std::is_same_v || std::is_same_v); - using T_ = std::conditional_t< - std::is_same_v, - unsigned __int128, + /// If we the highest 8 byte item is empty, we can print only the lowest item as i64 + if (_x.items[UInt128::_impl::little(1)] == 0) + return convert::itoa(_x.items[UInt128::_impl::little(0)], p); + + /// Doing operations using __int128 is faster, as we already rely on this feature + using T = unsigned __int128; + T x = (T(_x.items[UInt128::_impl::little(1)]) << 64) + T(_x.items[UInt128::_impl::little(0)]); + + /// We are going to accumulate blocks of 2 digits to print until the number is small enough to be printed as u64 + /// To do this we could do: x / 100, x % 100 + /// But this is too many iterations with long integers, so instead we can divide by a much longer integer + /// max_multiple_of_hundred_that_fits_in_64_bits and then get the blocks out of this (as u64) + static const T large_divisor = max_multiple_of_hundred_that_fits_in_64_bits; + static const T largest_uint64 = std::numeric_limits::max(); + uint8_t two_values[20] = {0}; // 39 Max characters / 2 + + int current_block = 0; + while (x > largest_uint64) + { + uint64_t remainder = uint64_t(x % large_divisor); + x /= large_divisor; + + int pos = current_block; + while (remainder) + { + two_values[pos] = uint8_t(remainder % 100); + pos++; + remainder /= 100; + } + current_block += max_multiple_of_hundred_blocks; + } + + char * highest_part_print = convert::itoa(uint64_t(x), p); + for (int i = 0; i < current_block; i++) + { + outTwoDigits(highest_part_print, two_values[current_block - 1 - i]); + highest_part_print += 2; + } + + return highest_part_print; +} + +ALWAYS_INLINE inline char * writeUIntText(UInt256 _x, char * p) +{ + /// If possible, treat it as a smaller integer as they are much faster to print + if (_x.items[UInt256::_impl::little(3)] == 0 && _x.items[UInt256::_impl::little(2)] == 0) + return writeUIntText(UInt128{_x.items[UInt256::_impl::little(0)], _x.items[UInt256::_impl::little(1)]}, p); + + /// If available (x86) we transform from our custom class to _BitInt(256) which has better support in the compiler + /// and produces better code + using T = #if defined(__x86_64__) # pragma clang diagnostic push # pragma clang diagnostic ignored "-Wbit-int-extension" unsigned _BitInt(256) # pragma clang diagnostic pop #else - T + UInt256 #endif - >; + ; - T_ x; - T_ hundred(100ULL); - if constexpr (std::is_same_v) - { - x = (T_(_x.items[T::_impl::little(1)]) << 64) + T_(_x.items[T::_impl::little(0)]); - } - else - { #if defined(__x86_64__) - x = (T_(_x.items[T::_impl::little(3)]) << 192) + (T_(_x.items[T::_impl::little(2)]) << 128) - + (T_(_x.items[T::_impl::little(1)]) << 64) + T_(_x.items[T::_impl::little(0)]); + T x = (T(_x.items[UInt256::_impl::little(3)]) << 192) + (T(_x.items[UInt256::_impl::little(2)]) << 128) + + (T(_x.items[UInt256::_impl::little(1)]) << 64) + T(_x.items[UInt256::_impl::little(0)]); #else - x = _x; + T x = _x; #endif + + /// Similar to writeUIntText(UInt128) only that in this case we will stop as soon 
as we reach the largest u128 + /// and switch to that function + uint8_t two_values[39] = {0}; // 78 Max characters / 2 + int current_pos = 0; + + static const T large_divisor = max_multiple_of_hundred_that_fits_in_64_bits; + static const T largest_uint128 = T(std::numeric_limits::max()) << 64 | T(std::numeric_limits::max()); + + while (x > largest_uint128) + { + uint64_t remainder = uint64_t(x % large_divisor); + x /= large_divisor; + + int pos = current_pos; + while (remainder) + { + two_values[pos] = uint8_t(remainder % 100); + pos++; + remainder /= 100; + } + current_pos += max_multiple_of_hundred_blocks; } - int len = digits10(x); - auto * pp = p + len; - while (x >= hundred) +#if defined(__x86_64__) + UInt128 pending{uint64_t(x), uint64_t(x >> 64)}; +#else + UInt128 pending{x.items[UInt256::_impl::little(0)], x.items[UInt256::_impl::little(1)]}; +#endif + + char * highest_part_print = writeUIntText(pending, p); + for (int i = 0; i < current_pos; i++) { - const auto i = x % hundred; - x /= hundred; - pp -= 2; - outTwoDigits(pp, i); + outTwoDigits(highest_part_print, two_values[current_pos - 1 - i]); + highest_part_print += 2; } - if (x < 10) - *p = '0' + x; - else - outTwoDigits(p, x); - return p + len; + + return highest_part_print; } -static ALWAYS_INLINE inline char * writeLeadingMinus(char * pos) + +ALWAYS_INLINE inline char * writeLeadingMinus(char * pos) { *pos = '-'; return pos + 1; } template -static ALWAYS_INLINE inline char * writeSIntText(T x, char * pos) +ALWAYS_INLINE inline char * writeSIntText(T x, char * pos) { static_assert(std::is_same_v || std::is_same_v); From 2bc4d27ac6f42af79120dac72b25db6e36ee4b42 Mon Sep 17 00:00:00 2001 From: Nikita Mikhaylov Date: Thu, 7 Mar 2024 19:24:39 +0000 Subject: [PATCH 170/985] Bye bye --- docker/packager/README.md | 1 - docs/en/operations/backup.md | 6 +- .../operations/utilities/clickhouse-copier.md | 187 -- docs/en/operations/utilities/index.md | 2 - .../sql-reference/statements/alter/column.md | 2 +- docs/ru/getting-started/tutorial.md | 4 - docs/ru/operations/backup.md | 6 - .../operations/utilities/clickhouse-copier.md | 183 -- docs/ru/operations/utilities/index.md | 1 - .../sql-reference/statements/alter/column.md | 4 +- docs/zh/getting-started/tutorial.md | 2 - docs/zh/operations/backup.md | 6 - .../operations/utilities/clickhouse-copier.md | 172 -- docs/zh/operations/utilities/index.md | 1 - docs/zh/sql-reference/statements/alter.md | 2 +- packages/clickhouse-server.yaml | 2 - programs/CMakeLists.txt | 2 - programs/copier/Aliases.h | 15 - programs/copier/CMakeLists.txt | 28 - programs/copier/ClusterCopier.cpp | 2076 ----------------- programs/copier/ClusterCopier.h | 240 -- programs/copier/ClusterCopierApp.cpp | 252 -- programs/copier/ClusterCopierApp.h | 99 - programs/copier/ClusterPartition.h | 22 - programs/copier/Internals.cpp | 280 --- programs/copier/Internals.h | 198 -- programs/copier/ShardPartition.cpp | 70 - programs/copier/ShardPartition.h | 54 - programs/copier/ShardPartitionPiece.cpp | 64 - programs/copier/ShardPartitionPiece.h | 43 - programs/copier/StatusAccumulator.cpp | 48 - programs/copier/StatusAccumulator.h | 27 - programs/copier/TaskCluster.cpp | 74 - programs/copier/TaskCluster.h | 51 - programs/copier/TaskShard.cpp | 37 - programs/copier/TaskShard.h | 56 - programs/copier/TaskTable.cpp | 222 -- programs/copier/TaskTable.h | 173 -- programs/copier/ZooKeeperStaff.h | 221 -- programs/copier/clickhouse-copier.cpp | 1 - .../testdata/configs/xml/config.xml | 2 +- .../testdata/configs/yaml/config.yaml | 2 +- 
.../testdata/configs/yandex_xml/config.xml | 2 +- programs/install/Install.cpp | 1 - programs/main.cpp | 2 - programs/server/config.xml | 2 +- programs/server/config.yaml.example | 2 +- src/Storages/StorageDistributed.h | 1 - tests/integration/README.md | 2 +- .../test_cluster_copier/__init__.py | 0 .../configs/conf.d/clusters.xml | 73 - .../configs/conf.d/clusters_trivial.xml | 20 - .../configs/conf.d/ddl.xml | 5 - .../configs/conf.d/query_log.xml | 14 - .../configs/config-copier.xml | 11 - .../test_cluster_copier/configs/users.xml | 34 - .../configs_three_nodes/conf.d/clusters.xml | 27 - .../configs_three_nodes/conf.d/ddl.xml | 5 - .../configs_three_nodes/config-copier.xml | 27 - .../configs_three_nodes/users.xml | 32 - .../configs_two_nodes/conf.d/clusters.xml | 22 - .../configs_two_nodes/conf.d/ddl.xml | 5 - .../conf.d/storage_configuration.xml | 34 - .../configs_two_nodes/config-copier.xml | 19 - .../configs_two_nodes/users.xml | 32 - .../test_cluster_copier/task0_description.xml | 95 - .../task_drop_target_partition.xml | 41 - .../task_month_to_week_description.xml | 99 - .../test_cluster_copier/task_no_arg.xml | 39 - .../test_cluster_copier/task_no_index.xml | 109 - .../task_non_partitioned_table.xml | 39 - .../test_cluster_copier/task_self_copy.xml | 63 - .../test_cluster_copier/task_skip_index.xml | 39 - .../test_cluster_copier/task_taxi_data.xml | 42 - .../task_test_block_size.xml | 101 - .../test_cluster_copier/task_trivial.xml | 63 - .../task_trivial_without_arguments.xml | 63 - .../test_cluster_copier/task_ttl_columns.xml | 39 - .../task_ttl_move_to_volume.xml | 39 - .../task_with_different_schema.xml | 39 - tests/integration/test_cluster_copier/test.py | 653 ------ .../test_cluster_copier/test_three_nodes.py | 286 --- .../test_cluster_copier/test_trivial.py | 227 -- .../test_cluster_copier/test_two_nodes.py | 597 ----- .../test_config_xml_full/configs/config.xml | 2 +- 85 files changed, 12 insertions(+), 7973 deletions(-) delete mode 100644 docs/en/operations/utilities/clickhouse-copier.md delete mode 100644 docs/ru/operations/utilities/clickhouse-copier.md delete mode 100644 docs/zh/operations/utilities/clickhouse-copier.md delete mode 100644 programs/copier/Aliases.h delete mode 100644 programs/copier/CMakeLists.txt delete mode 100644 programs/copier/ClusterCopier.cpp delete mode 100644 programs/copier/ClusterCopier.h delete mode 100644 programs/copier/ClusterCopierApp.cpp delete mode 100644 programs/copier/ClusterCopierApp.h delete mode 100644 programs/copier/ClusterPartition.h delete mode 100644 programs/copier/Internals.cpp delete mode 100644 programs/copier/Internals.h delete mode 100644 programs/copier/ShardPartition.cpp delete mode 100644 programs/copier/ShardPartition.h delete mode 100644 programs/copier/ShardPartitionPiece.cpp delete mode 100644 programs/copier/ShardPartitionPiece.h delete mode 100644 programs/copier/StatusAccumulator.cpp delete mode 100644 programs/copier/StatusAccumulator.h delete mode 100644 programs/copier/TaskCluster.cpp delete mode 100644 programs/copier/TaskCluster.h delete mode 100644 programs/copier/TaskShard.cpp delete mode 100644 programs/copier/TaskShard.h delete mode 100644 programs/copier/TaskTable.cpp delete mode 100644 programs/copier/TaskTable.h delete mode 100644 programs/copier/ZooKeeperStaff.h delete mode 100644 programs/copier/clickhouse-copier.cpp delete mode 100644 tests/integration/test_cluster_copier/__init__.py delete mode 100644 tests/integration/test_cluster_copier/configs/conf.d/clusters.xml delete mode 100644 
tests/integration/test_cluster_copier/configs/conf.d/clusters_trivial.xml delete mode 100644 tests/integration/test_cluster_copier/configs/conf.d/ddl.xml delete mode 100644 tests/integration/test_cluster_copier/configs/conf.d/query_log.xml delete mode 100644 tests/integration/test_cluster_copier/configs/config-copier.xml delete mode 100644 tests/integration/test_cluster_copier/configs/users.xml delete mode 100644 tests/integration/test_cluster_copier/configs_three_nodes/conf.d/clusters.xml delete mode 100644 tests/integration/test_cluster_copier/configs_three_nodes/conf.d/ddl.xml delete mode 100644 tests/integration/test_cluster_copier/configs_three_nodes/config-copier.xml delete mode 100644 tests/integration/test_cluster_copier/configs_three_nodes/users.xml delete mode 100644 tests/integration/test_cluster_copier/configs_two_nodes/conf.d/clusters.xml delete mode 100644 tests/integration/test_cluster_copier/configs_two_nodes/conf.d/ddl.xml delete mode 100644 tests/integration/test_cluster_copier/configs_two_nodes/conf.d/storage_configuration.xml delete mode 100644 tests/integration/test_cluster_copier/configs_two_nodes/config-copier.xml delete mode 100644 tests/integration/test_cluster_copier/configs_two_nodes/users.xml delete mode 100644 tests/integration/test_cluster_copier/task0_description.xml delete mode 100644 tests/integration/test_cluster_copier/task_drop_target_partition.xml delete mode 100644 tests/integration/test_cluster_copier/task_month_to_week_description.xml delete mode 100644 tests/integration/test_cluster_copier/task_no_arg.xml delete mode 100644 tests/integration/test_cluster_copier/task_no_index.xml delete mode 100644 tests/integration/test_cluster_copier/task_non_partitioned_table.xml delete mode 100644 tests/integration/test_cluster_copier/task_self_copy.xml delete mode 100644 tests/integration/test_cluster_copier/task_skip_index.xml delete mode 100644 tests/integration/test_cluster_copier/task_taxi_data.xml delete mode 100644 tests/integration/test_cluster_copier/task_test_block_size.xml delete mode 100644 tests/integration/test_cluster_copier/task_trivial.xml delete mode 100644 tests/integration/test_cluster_copier/task_trivial_without_arguments.xml delete mode 100644 tests/integration/test_cluster_copier/task_ttl_columns.xml delete mode 100644 tests/integration/test_cluster_copier/task_ttl_move_to_volume.xml delete mode 100644 tests/integration/test_cluster_copier/task_with_different_schema.xml delete mode 100644 tests/integration/test_cluster_copier/test.py delete mode 100644 tests/integration/test_cluster_copier/test_three_nodes.py delete mode 100644 tests/integration/test_cluster_copier/test_trivial.py delete mode 100644 tests/integration/test_cluster_copier/test_two_nodes.py diff --git a/docker/packager/README.md b/docker/packager/README.md index e0b7f38ea58..3604e8585a4 100644 --- a/docker/packager/README.md +++ b/docker/packager/README.md @@ -28,7 +28,6 @@ lrwxrwxrwx 1 root root 10 clickhouse-benchmark -> clickhouse lrwxrwxrwx 1 root root 10 clickhouse-clang -> clickhouse lrwxrwxrwx 1 root root 10 clickhouse-client -> clickhouse lrwxrwxrwx 1 root root 10 clickhouse-compressor -> clickhouse -lrwxrwxrwx 1 root root 10 clickhouse-copier -> clickhouse lrwxrwxrwx 1 root root 10 clickhouse-extract-from-config -> clickhouse lrwxrwxrwx 1 root root 10 clickhouse-format -> clickhouse lrwxrwxrwx 1 root root 10 clickhouse-lld -> clickhouse diff --git a/docs/en/operations/backup.md b/docs/en/operations/backup.md index 2d9bf2a2ee8..8639af468c2 100644 --- 
a/docs/en/operations/backup.md +++ b/docs/en/operations/backup.md @@ -170,7 +170,7 @@ RESTORE TABLE test.table PARTITIONS '2', '3' ### Backups as tar archives -Backups can also be stored as tar archives. The functionality is the same as for zip, except that a password is not supported. +Backups can also be stored as tar archives. The functionality is the same as for zip, except that a password is not supported. Write a backup as a tar: ``` @@ -444,10 +444,6 @@ Often data that is ingested into ClickHouse is delivered through some sort of pe Some local filesystems provide snapshot functionality (for example, [ZFS](https://en.wikipedia.org/wiki/ZFS)), but they might not be the best choice for serving live queries. A possible solution is to create additional replicas with this kind of filesystem and exclude them from the [Distributed](../engines/table-engines/special/distributed.md) tables that are used for `SELECT` queries. Snapshots on such replicas will be out of reach of any queries that modify data. As a bonus, these replicas might have special hardware configurations with more disks attached per server, which would be cost-effective. -### clickhouse-copier {#clickhouse-copier} - -[clickhouse-copier](../operations/utilities/clickhouse-copier.md) is a versatile tool that was initially created to re-shard petabyte-sized tables. It can also be used for backup and restore purposes because it reliably copies data between ClickHouse tables and clusters. - For smaller volumes of data, a simple `INSERT INTO ... SELECT ...` to remote tables might work as well. ### Manipulations with Parts {#manipulations-with-parts} diff --git a/docs/en/operations/utilities/clickhouse-copier.md b/docs/en/operations/utilities/clickhouse-copier.md deleted file mode 100644 index 0d329487504..00000000000 --- a/docs/en/operations/utilities/clickhouse-copier.md +++ /dev/null @@ -1,187 +0,0 @@ ---- -slug: /en/operations/utilities/clickhouse-copier -sidebar_position: 59 -sidebar_label: clickhouse-copier ---- - -# clickhouse-copier - -Copies data from the tables in one cluster to tables in another (or the same) cluster. - -:::note -To get a consistent copy, the data in the source tables and partitions should not change during the entire process. -::: - -You can run multiple `clickhouse-copier` instances on different servers to perform the same job. ClickHouse Keeper, or ZooKeeper, is used for syncing the processes. - -After starting, `clickhouse-copier`: - -- Connects to ClickHouse Keeper and receives: - - - Copying jobs. - - The state of the copying jobs. - -- It performs the jobs. - - Each running process chooses the “closest” shard of the source cluster and copies the data into the destination cluster, resharding the data if necessary. - -`clickhouse-copier` tracks the changes in ClickHouse Keeper and applies them on the fly. - -To reduce network traffic, we recommend running `clickhouse-copier` on the same server where the source data is located. - -## Running Clickhouse-copier {#running-clickhouse-copier} - -The utility should be run manually: - -``` bash -$ clickhouse-copier --daemon --config keeper.xml --task-path /task/path --base-dir /path/to/dir -``` - -Parameters: - -- `daemon` — Starts `clickhouse-copier` in daemon mode. -- `config` — The path to the `keeper.xml` file with the parameters for the connection to ClickHouse Keeper. -- `task-path` — The path to the ClickHouse Keeper node. This node is used for syncing `clickhouse-copier` processes and storing tasks. Tasks are stored in `$task-path/description`. 
-- `task-file` — Optional path to file with task configuration for initial upload to ClickHouse Keeper. -- `task-upload-force` — Force upload `task-file` even if node already exists. Default is false. -- `base-dir` — The path to logs and auxiliary files. When it starts, `clickhouse-copier` creates `clickhouse-copier_YYYYMMHHSS_` subdirectories in `$base-dir`. If this parameter is omitted, the directories are created in the directory where `clickhouse-copier` was launched. - -## Format of keeper.xml {#format-of-zookeeper-xml} - -``` xml - - - trace - 100M - 3 - - - - - 127.0.0.1 - 2181 - - - -``` - -## Configuration of Copying Tasks {#configuration-of-copying-tasks} - -``` xml - - - - - - - false - - 127.0.0.1 - 9000 - - - - ... - - - - ... - - - - - 2 - - - - 1 - - - - - 0 - - - - - 3 - - 1 - - - - - - - - source_cluster - test - hits - - - destination_cluster - test - hits2 - - - - ENGINE=ReplicatedMergeTree('/clickhouse/tables/{cluster}/{shard}/hits2', '{replica}') - PARTITION BY toMonday(date) - ORDER BY (CounterID, EventDate) - - - - jumpConsistentHash(intHash64(UserID), 2) - - - CounterID != 0 - - - - '2018-02-26' - '2018-03-05' - ... - - - - - - ... - - ... - - -``` - -`clickhouse-copier` tracks the changes in `/task/path/description` and applies them on the fly. For instance, if you change the value of `max_workers`, the number of processes running tasks will also change. diff --git a/docs/en/operations/utilities/index.md b/docs/en/operations/utilities/index.md index 8959073d00e..912a5b9ccb1 100644 --- a/docs/en/operations/utilities/index.md +++ b/docs/en/operations/utilities/index.md @@ -2,13 +2,11 @@ slug: /en/operations/utilities/ sidebar_position: 56 sidebar_label: List of tools and utilities -pagination_next: 'en/operations/utilities/clickhouse-copier' --- # List of tools and utilities - [clickhouse-local](../../operations/utilities/clickhouse-local.md) — Allows running SQL queries on data without starting the ClickHouse server, similar to how `awk` does this. -- [clickhouse-copier](../../operations/utilities/clickhouse-copier.md) — Copies (and reshards) data from one cluster to another cluster. - [clickhouse-benchmark](../../operations/utilities/clickhouse-benchmark.md) — Loads server with the custom queries and settings. - [clickhouse-format](../../operations/utilities/clickhouse-format.md) — Enables formatting input queries. - [ClickHouse obfuscator](../../operations/utilities/clickhouse-obfuscator.md) — Obfuscates data. diff --git a/docs/en/sql-reference/statements/alter/column.md b/docs/en/sql-reference/statements/alter/column.md index 0989c151d18..a23710b12bd 100644 --- a/docs/en/sql-reference/statements/alter/column.md +++ b/docs/en/sql-reference/statements/alter/column.md @@ -335,7 +335,7 @@ The `ALTER` query lets you create and delete separate elements (columns) in nest There is no support for deleting columns in the primary key or the sampling key (columns that are used in the `ENGINE` expression). Changing the type for columns that are included in the primary key is only possible if this change does not cause the data to be modified (for example, you are allowed to add values to an Enum or to change a type from `DateTime` to `UInt32`). 
-If the `ALTER` query is not sufficient to make the table changes you need, you can create a new table, copy the data to it using the [INSERT SELECT](/docs/en/sql-reference/statements/insert-into.md/#inserting-the-results-of-select) query, then switch the tables using the [RENAME](/docs/en/sql-reference/statements/rename.md/#rename-table) query and delete the old table. You can use the [clickhouse-copier](/docs/en/operations/utilities/clickhouse-copier.md) as an alternative to the `INSERT SELECT` query. +If the `ALTER` query is not sufficient to make the table changes you need, you can create a new table, copy the data to it using the [INSERT SELECT](/docs/en/sql-reference/statements/insert-into.md/#inserting-the-results-of-select) query, then switch the tables using the [RENAME](/docs/en/sql-reference/statements/rename.md/#rename-table) query and delete the old table. The `ALTER` query blocks all reads and writes for the table. In other words, if a long `SELECT` is running at the time of the `ALTER` query, the `ALTER` query will wait for it to complete. At the same time, all new queries to the same table will wait while this `ALTER` is running. diff --git a/docs/ru/getting-started/tutorial.md b/docs/ru/getting-started/tutorial.md index 34064b6cf2f..8c827137e6d 100644 --- a/docs/ru/getting-started/tutorial.md +++ b/docs/ru/getting-started/tutorial.md @@ -585,10 +585,6 @@ ENGINE = Distributed(perftest_3shards_1replicas, tutorial, hits_local, rand()); INSERT INTO tutorial.hits_all SELECT * FROM tutorial.hits_v1; ``` -:::danger Внимание! -Этот подход не годится для сегментирования больших таблиц. Есть инструмент [clickhouse-copier](../operations/utilities/clickhouse-copier.md), специально предназначенный для перераспределения любых больших таблиц. -::: - Как и следовало ожидать, вычислительно сложные запросы работают втрое быстрее, если они выполняются на трёх серверах, а не на одном. В данном случае мы использовали кластер из трёх сегментов с одной репликой для каждого. diff --git a/docs/ru/operations/backup.md b/docs/ru/operations/backup.md index 9ff13bbc8a6..50ee6b45e09 100644 --- a/docs/ru/operations/backup.md +++ b/docs/ru/operations/backup.md @@ -24,12 +24,6 @@ sidebar_label: "Резервное копирование данных" Некоторые локальные файловые системы позволяют делать снимки (например, [ZFS](https://en.wikipedia.org/wiki/ZFS)), но они могут быть не лучшим выбором для обслуживания живых запросов. Возможным решением является создание дополнительных реплик с такой файловой системой и исключение их из [Distributed](../engines/table-engines/special/distributed.md) таблиц, используемых для запросов `SELECT`. Снимки на таких репликах будут недоступны для запросов, изменяющих данные. В качестве бонуса, эти реплики могут иметь особые конфигурации оборудования с большим количеством дисков, подключенных к серверу, что будет экономически эффективным. -## clickhouse-copier {#clickhouse-copier} - -[clickhouse-copier](utilities/clickhouse-copier.md) — это универсальный инструмент, который изначально был создан для перешардирования таблиц с петабайтами данных. Его также можно использовать для резервного копирования и восстановления, поскольку он надёжно копирует данные между таблицами и кластерами ClickHouse. - -Для небольших объёмов данных можно применять `INSERT INTO ... SELECT ...` в удалённые таблицы. - ## Манипуляции с партициями {#manipuliatsii-s-partitsiiami} ClickHouse позволяет использовать запрос `ALTER TABLE ... FREEZE PARTITION ...` для создания локальной копии партиций таблицы. 
Это реализуется с помощью жестких ссылок (hardlinks) на каталог `/var/lib/clickhouse/shadow/`, поэтому такая копия обычно не занимает дополнительное место на диске для старых данных. Созданные копии файлов не обрабатываются сервером ClickHouse, поэтому вы можете просто оставить их там: у вас будет простая резервная копия, которая не требует дополнительной внешней системы, однако при аппаратных проблемах вы можете утратить и актуальные данные и сохраненную копию. По этой причине, лучше удаленно скопировать их в другое место, а затем удалить локальную копию. Распределенные файловые системы и хранилища объектов по-прежнему являются хорошими вариантами для этого, однако можно использовать и обычные присоединенные файловые серверы с достаточно большой ёмкостью (в этом случае передача будет происходить через сетевую файловую систему или, возможно, [rsync](https://en.wikipedia.org/wiki/Rsync)). diff --git a/docs/ru/operations/utilities/clickhouse-copier.md b/docs/ru/operations/utilities/clickhouse-copier.md deleted file mode 100644 index da86ef2d35d..00000000000 --- a/docs/ru/operations/utilities/clickhouse-copier.md +++ /dev/null @@ -1,183 +0,0 @@ ---- -slug: /ru/operations/utilities/clickhouse-copier -sidebar_position: 59 -sidebar_label: clickhouse-copier ---- - -# clickhouse-copier {#clickhouse-copier} - -Копирует данные из таблиц одного кластера в таблицы другого (или этого же) кластера. - -Можно запустить несколько `clickhouse-copier` для разных серверах для выполнения одного и того же задания. Для синхронизации между процессами используется ZooKeeper. - -После запуска, `clickhouse-copier`: - -- Соединяется с ZooKeeper и получает: - - - Задания на копирование. - - Состояние заданий на копирование. - -- Выполняет задания. - - Каждый запущенный процесс выбирает "ближайший" шард исходного кластера и копирует данные в кластер назначения, при необходимости перешардируя их. - -`clickhouse-copier` отслеживает изменения в ZooKeeper и применяет их «на лету». - -Для снижения сетевого трафика рекомендуем запускать `clickhouse-copier` на том же сервере, где находятся исходные данные. - -## Запуск Clickhouse-copier {#zapusk-clickhouse-copier} - -Утилиту следует запускать вручную следующим образом: - -``` bash -$ clickhouse-copier --daemon --config zookeeper.xml --task-path /task/path --base-dir /path/to/dir -``` - -Параметры запуска: - -- `daemon` - запускает `clickhouse-copier` в режиме демона. -- `config` - путь к файлу `zookeeper.xml` с параметрами соединения с ZooKeeper. -- `task-path` - путь к ноде ZooKeeper. Нода используется для синхронизации между процессами `clickhouse-copier` и для хранения заданий. Задания хранятся в `$task-path/description`. -- `task-file` - необязательный путь к файлу с описанием конфигурация заданий для загрузки в ZooKeeper. -- `task-upload-force` - Загрузить `task-file` в ZooKeeper даже если уже было загружено. -- `base-dir` - путь к логам и вспомогательным файлам. При запуске `clickhouse-copier` создает в `$base-dir` подкаталоги `clickhouse-copier_YYYYMMHHSS_`. Если параметр не указан, то каталоги будут создаваться в каталоге, где `clickhouse-copier` был запущен. - -## Формат Zookeeper.xml {#format-zookeeper-xml} - -``` xml - - - trace - 100M - 3 - - - - - 127.0.0.1 - 2181 - - - -``` - -## Конфигурация заданий на копирование {#konfiguratsiia-zadanii-na-kopirovanie} - -``` xml - - - - - - - false - - 127.0.0.1 - 9000 - - - - ... - - - - ... 
- - - - - 2 - - - - 1 - - - - - 0 - - - - - 3 - - 1 - - - - - - - - source_cluster - test - hits - - - destination_cluster - test - hits2 - - - - ENGINE=ReplicatedMergeTree('/clickhouse/tables/{cluster}/{shard}/hits2', '{replica}') - PARTITION BY toMonday(date) - ORDER BY (CounterID, EventDate) - - - - jumpConsistentHash(intHash64(UserID), 2) - - - CounterID != 0 - - - - '2018-02-26' - '2018-03-05' - ... - - - - - - ... - - ... - - -``` - -`clickhouse-copier` отслеживает изменения `/task/path/description` и применяет их «на лету». Если вы поменяете, например, значение `max_workers`, то количество процессов, выполняющих задания, также изменится. diff --git a/docs/ru/operations/utilities/index.md b/docs/ru/operations/utilities/index.md index 9eb90a3037c..e4b01a0276d 100644 --- a/docs/ru/operations/utilities/index.md +++ b/docs/ru/operations/utilities/index.md @@ -7,7 +7,6 @@ sidebar_position: 56 # Утилиты ClickHouse {#utility-clickhouse} - [clickhouse-local](clickhouse-local.md) - позволяет выполнять SQL-запросы над данными без остановки сервера ClickHouse, подобно утилите `awk`. -- [clickhouse-copier](clickhouse-copier.md) - копирует (и перешардирует) данные с одного кластера на другой. - [clickhouse-benchmark](../../operations/utilities/clickhouse-benchmark.md) — устанавливает соединение с сервером ClickHouse и запускает циклическое выполнение указанных запросов. - [clickhouse-format](../../operations/utilities/clickhouse-format.md) — позволяет форматировать входящие запросы. - [ClickHouse obfuscator](../../operations/utilities/clickhouse-obfuscator.md) — обфусцирует данные. diff --git a/docs/ru/sql-reference/statements/alter/column.md b/docs/ru/sql-reference/statements/alter/column.md index 385a9835eca..2ea045f4ae3 100644 --- a/docs/ru/sql-reference/statements/alter/column.md +++ b/docs/ru/sql-reference/statements/alter/column.md @@ -94,7 +94,7 @@ RENAME COLUMN [IF EXISTS] name to new_name Переименовывает столбец `name` в `new_name`. Если указано выражение `IF EXISTS`, то запрос не будет возвращать ошибку при условии, что столбец `name` не существует. Поскольку переименование не затрагивает физические данные колонки, запрос выполняется практически мгновенно. -**ЗАМЕЧЕНИЕ**: Столбцы, являющиеся частью основного ключа или ключа сортировки (заданные с помощью `ORDER BY` или `PRIMARY KEY`), не могут быть переименованы. Попытка переименовать эти слобцы приведет к `SQL Error [524]`. +**ЗАМЕЧЕНИЕ**: Столбцы, являющиеся частью основного ключа или ключа сортировки (заданные с помощью `ORDER BY` или `PRIMARY KEY`), не могут быть переименованы. Попытка переименовать эти слобцы приведет к `SQL Error [524]`. Пример: @@ -254,7 +254,7 @@ SELECT groupArray(x), groupArray(s) FROM tmp; Отсутствует возможность удалять столбцы, входящие в первичный ключ или ключ для сэмплирования (в общем, входящие в выражение `ENGINE`). Изменение типа у столбцов, входящих в первичный ключ возможно только в том случае, если это изменение не приводит к изменению данных (например, разрешено добавление значения в Enum или изменение типа с `DateTime` на `UInt32`). -Если возможностей запроса `ALTER` не хватает для нужного изменения таблицы, вы можете создать новую таблицу, скопировать туда данные с помощью запроса [INSERT SELECT](../insert-into.md#inserting-the-results-of-select), затем поменять таблицы местами с помощью запроса [RENAME](../rename.md#rename-table), и удалить старую таблицу. 
В качестве альтернативы для запроса `INSERT SELECT`, можно использовать инструмент [clickhouse-copier](../../../sql-reference/statements/alter/index.md). +Если возможностей запроса `ALTER` не хватает для нужного изменения таблицы, вы можете создать новую таблицу, скопировать туда данные с помощью запроса [INSERT SELECT](../insert-into.md#inserting-the-results-of-select), затем поменять таблицы местами с помощью запроса [RENAME](../rename.md#rename-table), и удалить старую таблицу. Запрос `ALTER` блокирует все чтения и записи для таблицы. То есть если на момент запроса `ALTER` выполнялся долгий `SELECT`, то запрос `ALTER` сначала дождётся его выполнения. И в это время все новые запросы к той же таблице будут ждать, пока завершится этот `ALTER`. diff --git a/docs/zh/getting-started/tutorial.md b/docs/zh/getting-started/tutorial.md index 989cf5f57d8..d0c9bda83ef 100644 --- a/docs/zh/getting-started/tutorial.md +++ b/docs/zh/getting-started/tutorial.md @@ -582,8 +582,6 @@ ENGINE = Distributed(perftest_3shards_1replicas, tutorial, hits_local, rand()); INSERT INTO tutorial.hits_all SELECT * FROM tutorial.hits_v1; ``` -!!! warning "注意:" - 这种方法不适合大型表的分片。 有一个单独的工具 [clickhouse-copier](../operations/utilities/clickhouse-copier.md) 这可以重新分片任意大表。 正如您所期望的那样,如果计算量大的查询使用3台服务器而不是一个,则运行速度快N倍。 diff --git a/docs/zh/operations/backup.md b/docs/zh/operations/backup.md index 6d491f9c2f7..48e852b4228 100644 --- a/docs/zh/operations/backup.md +++ b/docs/zh/operations/backup.md @@ -24,12 +24,6 @@ sidebar_label: "\u6570\u636E\u5907\u4EFD" 某些本地文件系统提供快照功能(例如, [ZFS](https://en.wikipedia.org/wiki/ZFS)),但它们可能不是提供实时查询的最佳选择。 一个可能的解决方案是使用这种文件系统创建额外的副本,并将它们与用于`SELECT` 查询的 [分布式](../engines/table-engines/special/distributed.md) 表分离。 任何修改数据的查询都无法访问此类副本上的快照。 作为回报,这些副本可能具有特殊的硬件配置,每个服务器附加更多的磁盘,这将是经济高效的。 -## clickhouse-copier {#clickhouse-copier} - -[clickhouse-copier](utilities/clickhouse-copier.md) 是一个多功能工具,最初创建它是为了用于重新切分pb大小的表。 因为它能够在ClickHouse表和集群之间可靠地复制数据,所以它也可用于备份和还原数据。 - -对于较小的数据量,一个简单的 `INSERT INTO ... SELECT ...` 到远程表也可以工作。 - ## part操作 {#manipulations-with-parts} ClickHouse允许使用 `ALTER TABLE ... FREEZE PARTITION ...` 查询以创建表分区的本地副本。 这是利用硬链接(hardlink)到 `/var/lib/clickhouse/shadow/` 文件夹中实现的,所以它通常不会因为旧数据而占用额外的磁盘空间。 创建的文件副本不由ClickHouse服务器处理,所以你可以把它们留在那里:你将有一个简单的备份,不需要任何额外的外部系统,但它仍然容易出现硬件问题。 出于这个原因,最好将它们远程复制到另一个位置,然后删除本地副本。 分布式文件系统和对象存储仍然是一个不错的选择,但是具有足够大容量的正常附加文件服务器也可以工作(在这种情况下,传输将通过网络文件系统或者也许是 [rsync](https://en.wikipedia.org/wiki/Rsync) 来进行). 
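A minimal sketch of the `ALTER TABLE ... FREEZE` backup flow described in the backup documentation above. The table `test.hits`, the partition `201803`, the snapshot name and the remote host `backup-host` are illustrative assumptions; paths assume the default ClickHouse data directory.

``` bash
# Create a local snapshot of one partition; hardlinks mean no extra space is used for old parts.
clickhouse-client --query "ALTER TABLE test.hits FREEZE PARTITION 201803 WITH NAME 'hits_201803_backup'"

# The frozen parts appear under the server's shadow directory.
SNAPSHOT_DIR=/var/lib/clickhouse/shadow/hits_201803_backup

# Ship the snapshot to remote storage, then remove the local copy,
# because a copy that stays on the same disks does not survive hardware failure.
rsync -a "$SNAPSHOT_DIR/" backup-host:/backups/test.hits/201803/
rm -rf "$SNAPSHOT_DIR"
```

Restoring is essentially the reverse: place the saved part directories into the target table's `detached/` directory and run `ALTER TABLE ... ATTACH PARTITION`.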
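The `INSERT SELECT` + `RENAME` workaround mentioned in the ALTER documentation above can be sketched as follows; the table `test.hits`, its columns and the new sorting key are hypothetical stand-ins for whatever change `ALTER` cannot express directly.

``` bash
# Build a new table with the desired structure, copy the data, swap names, drop the old table.
clickhouse-client --multiquery --query "
    CREATE TABLE test.hits_new (CounterID UInt32, EventDate Date, UserID UInt64)
        ENGINE = MergeTree ORDER BY (UserID, EventDate);

    -- Copy the data over; for large tables this is often done partition by partition.
    INSERT INTO test.hits_new SELECT CounterID, EventDate, UserID FROM test.hits;

    -- Swap the tables, then drop the old one.
    RENAME TABLE test.hits TO test.hits_old, test.hits_new TO test.hits;
    DROP TABLE test.hits_old;
"
```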
diff --git a/docs/zh/operations/utilities/clickhouse-copier.md b/docs/zh/operations/utilities/clickhouse-copier.md deleted file mode 100644 index b01edd9257c..00000000000 --- a/docs/zh/operations/utilities/clickhouse-copier.md +++ /dev/null @@ -1,172 +0,0 @@ ---- -slug: /zh/operations/utilities/clickhouse-copier ---- -# clickhouse-copier {#clickhouse-copier} - -将数据从一个群集中的表复制到另一个(或相同)群集中的表。 - -您可以运行多个 `clickhouse-copier` 不同服务器上的实例执行相同的作业。 ZooKeeper用于同步进程。 - -开始后, `clickhouse-copier`: - -- 连接到ZooKeeper并且接收: - - - 复制作业。 - - 复制作业的状态。 - -- 它执行的工作。 - - 每个正在运行的进程都会选择源集群的“最接近”分片,然后将数据复制到目标集群,并在必要时重新分片数据。 - -`clickhouse-copier` 跟踪ZooKeeper中的更改,并实时应用它们。 - -为了减少网络流量,我们建议运行 `clickhouse-copier` 在源数据所在的同一服务器上。 - -## 运行Clickhouse-copier {#running-clickhouse-copier} - -该实用程序应手动运行: - -``` bash -clickhouse-copier --daemon --config zookeeper.xml --task-path /task/path --base-dir /path/to/dir -``` - -参数: - -- `daemon` — 在守护进程模式下启动`clickhouse-copier`。 -- `config` — `zookeeper.xml`文件的路径,其中包含用于连接ZooKeeper的参数。 -- `task-path` — ZooKeeper节点的路径。 该节点用于同步`clickhouse-copier`进程和存储任务。 任务存储在`$task-path/description`中。 -- `task-file` — 可选的非必须参数, 指定一个包含任务配置的参数文件, 用于初始上传到ZooKeeper。 -- `task-upload-force` — 即使节点已经存在,也强制上载`task-file`。 -- `base-dir` — 日志和辅助文件的路径。 启动时,`clickhouse-copier`在`$base-dir`中创建`clickhouse-copier_YYYYMMHHSS_`子目录。 如果省略此参数,则会在启动`clickhouse-copier`的目录中创建目录。 - - - -## Zookeeper.xml格式 {#format-of-zookeeper-xml} - -``` xml - - - trace - 100M - 3 - - - - - 127.0.0.1 - 2181 - - - -``` - -## 复制任务的配置 {#configuration-of-copying-tasks} - -``` xml - - - - - - false - - 127.0.0.1 - 9000 - - - ... - - - - ... - - - - - 2 - - - - 1 - - - - - 0 - - - - - 3 - - 1 - - - - - - - - source_cluster - test - hits - - - destination_cluster - test - hits2 - - - - ENGINE=ReplicatedMergeTree('/clickhouse/tables/{cluster}/{shard}/hits2', '{replica}') - PARTITION BY toMonday(date) - ORDER BY (CounterID, EventDate) - - - - jumpConsistentHash(intHash64(UserID), 2) - - - CounterID != 0 - - - - '2018-02-26' - '2018-03-05' - ... - - - - - - ... - - ... 
- - -``` - -`clickhouse-copier` 跟踪更改 `/task/path/description` 并在飞行中应用它们。 例如,如果你改变的值 `max_workers`,运行任务的进程数也会发生变化。 diff --git a/docs/zh/operations/utilities/index.md b/docs/zh/operations/utilities/index.md index af158baf275..cebe312450c 100644 --- a/docs/zh/operations/utilities/index.md +++ b/docs/zh/operations/utilities/index.md @@ -4,5 +4,4 @@ slug: /zh/operations/utilities/ # 实用工具 {#clickhouse-utility} - [本地查询](clickhouse-local.md) — 在不停止ClickHouse服务的情况下,对数据执行查询操作(类似于 `awk` 命令)。 -- [跨集群复制](clickhouse-copier.md) — 在不同集群间复制数据。 - [性能测试](clickhouse-benchmark.md) — 连接到Clickhouse服务器,执行性能测试。 diff --git a/docs/zh/sql-reference/statements/alter.md b/docs/zh/sql-reference/statements/alter.md index 002d5102fa3..48665ae04ab 100644 --- a/docs/zh/sql-reference/statements/alter.md +++ b/docs/zh/sql-reference/statements/alter.md @@ -150,7 +150,7 @@ ALTER TABLE visits MODIFY COLUMN browser Array(String) 不支持对primary key或者sampling key中的列(在 `ENGINE` 表达式中用到的列)进行删除操作。改变包含在primary key中的列的类型时,如果操作不会导致数据的变化(例如,往Enum中添加一个值,或者将`DateTime` 类型改成 `UInt32`),那么这种操作是可行的。 -如果 `ALTER` 操作不足以完成你想要的表变动操作,你可以创建一张新的表,通过 [INSERT SELECT](../../sql-reference/statements/insert-into.md#inserting-the-results-of-select)将数据拷贝进去,然后通过 [RENAME](../../sql-reference/statements/misc.md#misc_operations-rename)将新的表改成和原有表一样的名称,并删除原有的表。你可以使用 [clickhouse-copier](../../operations/utilities/clickhouse-copier.md) 代替 `INSERT SELECT`。 +如果 `ALTER` 操作不足以完成你想要的表变动操作,你可以创建一张新的表,通过 [INSERT SELECT](../../sql-reference/statements/insert-into.md#inserting-the-results-of-select)将数据拷贝进去,然后通过 [RENAME](../../sql-reference/statements/misc.md#misc_operations-rename)将新的表改成和原有表一样的名称,并删除原有的表。 `ALTER` 操作会阻塞对表的所有读写操作。换句话说,当一个大的 `SELECT` 语句和 `ALTER`同时执行时,`ALTER`会等待,直到 `SELECT` 执行结束。与此同时,当 `ALTER` 运行时,新的 sql 语句将会等待。 diff --git a/packages/clickhouse-server.yaml b/packages/clickhouse-server.yaml index 7894129b8e3..dc183ead102 100644 --- a/packages/clickhouse-server.yaml +++ b/packages/clickhouse-server.yaml @@ -50,8 +50,6 @@ contents: dst: /etc/init.d/clickhouse-server - src: clickhouse-server.service dst: /lib/systemd/system/clickhouse-server.service -- src: root/usr/bin/clickhouse-copier - dst: /usr/bin/clickhouse-copier - src: root/usr/bin/clickhouse-server dst: /usr/bin/clickhouse-server # clickhouse-keeper part diff --git a/programs/CMakeLists.txt b/programs/CMakeLists.txt index 62bcf068879..d945fdf4a6f 100644 --- a/programs/CMakeLists.txt +++ b/programs/CMakeLists.txt @@ -122,7 +122,6 @@ add_subdirectory (local) add_subdirectory (benchmark) add_subdirectory (extract-from-config) add_subdirectory (compressor) -add_subdirectory (copier) add_subdirectory (format) add_subdirectory (obfuscator) add_subdirectory (install) @@ -200,7 +199,6 @@ clickhouse_program_install(clickhouse-server server) clickhouse_program_install(clickhouse-client client chc) clickhouse_program_install(clickhouse-local local chl ch) clickhouse_program_install(clickhouse-benchmark benchmark) -clickhouse_program_install(clickhouse-copier copier) clickhouse_program_install(clickhouse-extract-from-config extract-from-config) clickhouse_program_install(clickhouse-compressor compressor) clickhouse_program_install(clickhouse-format format) diff --git a/programs/copier/Aliases.h b/programs/copier/Aliases.h deleted file mode 100644 index 02be3441acd..00000000000 --- a/programs/copier/Aliases.h +++ /dev/null @@ -1,15 +0,0 @@ -#pragma once - -#include - -#include - -#include - -namespace DB -{ - using ConfigurationPtr = Poco::AutoPtr; - - using DatabaseAndTableName = std::pair; - using 
ListOfDatabasesAndTableNames = std::vector; -} diff --git a/programs/copier/CMakeLists.txt b/programs/copier/CMakeLists.txt deleted file mode 100644 index 2c17e70bc5e..00000000000 --- a/programs/copier/CMakeLists.txt +++ /dev/null @@ -1,28 +0,0 @@ -set(CLICKHOUSE_COPIER_SOURCES - "${CMAKE_CURRENT_SOURCE_DIR}/ClusterCopierApp.cpp" - "${CMAKE_CURRENT_SOURCE_DIR}/ClusterCopier.cpp" - "${CMAKE_CURRENT_SOURCE_DIR}/Internals.cpp" - "${CMAKE_CURRENT_SOURCE_DIR}/ShardPartition.cpp" - "${CMAKE_CURRENT_SOURCE_DIR}/ShardPartitionPiece.cpp" - "${CMAKE_CURRENT_SOURCE_DIR}/StatusAccumulator.cpp" - "${CMAKE_CURRENT_SOURCE_DIR}/TaskCluster.cpp" - "${CMAKE_CURRENT_SOURCE_DIR}/TaskShard.cpp" - "${CMAKE_CURRENT_SOURCE_DIR}/TaskTable.cpp") - -set (CLICKHOUSE_COPIER_LINK - PRIVATE - clickhouse_common_zookeeper - clickhouse_common_config - clickhouse_parsers - clickhouse_functions - clickhouse_table_functions - clickhouse_aggregate_functions - string_utils - - PUBLIC - daemon -) - -set(CLICKHOUSE_COPIER_INCLUDE SYSTEM PRIVATE ${CMAKE_CURRENT_SOURCE_DIR}) - -clickhouse_program_add(copier) diff --git a/programs/copier/ClusterCopier.cpp b/programs/copier/ClusterCopier.cpp deleted file mode 100644 index 59505d08f5c..00000000000 --- a/programs/copier/ClusterCopier.cpp +++ /dev/null @@ -1,2076 +0,0 @@ -#include "ClusterCopier.h" - -#include "Internals.h" -#include "StatusAccumulator.h" - -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include - -namespace CurrentMetrics -{ - extern const Metric LocalThread; - extern const Metric LocalThreadActive; - extern const Metric LocalThreadScheduled; -} - -namespace DB -{ - -namespace ErrorCodes -{ - extern const int NOT_IMPLEMENTED; - extern const int LOGICAL_ERROR; - extern const int UNFINISHED; - extern const int BAD_ARGUMENTS; -} - - -void ClusterCopier::init() -{ - auto zookeeper = getContext()->getZooKeeper(); - - task_description_watch_callback = [this] (const Coordination::WatchResponse & response) - { - if (response.error != Coordination::Error::ZOK) - return; - UInt64 version = ++task_description_version; - LOG_INFO(log, "Task description should be updated, local version {}", version); - }; - - task_description_path = task_zookeeper_path + "/description"; - task_cluster = std::make_unique(task_zookeeper_path, working_database_name); - - reloadTaskDescription(); - - task_cluster->loadTasks(*task_cluster_current_config); - getContext()->setClustersConfig(task_cluster_current_config, false, task_cluster->clusters_prefix); - - /// Set up shards and their priority - task_cluster->random_engine.seed(randomSeed()); - for (auto & task_table : task_cluster->table_tasks) - { - task_table.cluster_pull = getContext()->getCluster(task_table.cluster_pull_name); - task_table.cluster_push = getContext()->getCluster(task_table.cluster_push_name); - task_table.initShards(task_cluster->random_engine); - } - - LOG_INFO(log, "Will process {} table tasks", task_cluster->table_tasks.size()); - - /// Do not initialize tables, will make deferred initialization in process() - - zookeeper->createAncestors(getWorkersPathVersion() + "/"); - zookeeper->createAncestors(getWorkersPath() + "/"); - /// Init status node - zookeeper->createIfNotExists(task_zookeeper_path + "/status", "{}"); -} - -template -decltype(auto) ClusterCopier::retry(T && func, UInt64 max_tries) -{ - std::exception_ptr exception; - - if (max_tries == 0) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Cannot perform 
zero retries"); - - for (UInt64 try_number = 1; try_number <= max_tries; ++try_number) - { - try - { - return func(); - } - catch (...) - { - exception = std::current_exception(); - if (try_number < max_tries) - { - tryLogCurrentException(log, "Will retry"); - std::this_thread::sleep_for(retry_delay_ms); - } - } - } - - std::rethrow_exception(exception); -} - - -void ClusterCopier::discoverShardPartitions(const ConnectionTimeouts & timeouts, const TaskShardPtr & task_shard) -{ - TaskTable & task_table = task_shard->task_table; - - LOG_INFO(log, "Discover partitions of shard {}", task_shard->getDescription()); - - auto get_partitions = [&] () { return getShardPartitions(timeouts, *task_shard); }; - auto existing_partitions_names = retry(get_partitions, 60); - Strings filtered_partitions_names; - Strings missing_partitions; - - /// Check that user specified correct partition names - auto check_partition_format = [] (const DataTypePtr & type, const String & partition_text_quoted) - { - MutableColumnPtr column_dummy = type->createColumn(); - ReadBufferFromString rb(partition_text_quoted); - - try - { - type->getDefaultSerialization()->deserializeTextQuoted(*column_dummy, rb, FormatSettings()); - } - catch (Exception & e) - { - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Partition {} has incorrect format. {}", partition_text_quoted, e.displayText()); - } - }; - - if (task_table.has_enabled_partitions) - { - /// Process partition in order specified by - for (const String & partition_name : task_table.enabled_partitions) - { - /// Check that user specified correct partition names - check_partition_format(task_shard->partition_key_column.type, partition_name); - - auto it = existing_partitions_names.find(partition_name); - - /// Do not process partition if it is not in enabled_partitions list - if (it == existing_partitions_names.end()) - { - missing_partitions.emplace_back(partition_name); - continue; - } - - filtered_partitions_names.emplace_back(*it); - } - - for (const String & partition_name : existing_partitions_names) - { - if (!task_table.enabled_partitions_set.contains(partition_name)) - { - LOG_INFO(log, "Partition {} will not be processed, since it is not in enabled_partitions of {}", partition_name, task_table.table_id); - } - } - } - else - { - for (const String & partition_name : existing_partitions_names) - filtered_partitions_names.emplace_back(partition_name); - } - - for (const String & partition_name : filtered_partitions_names) - { - const size_t number_of_splits = task_table.number_of_splits; - task_shard->partition_tasks.emplace(partition_name, ShardPartition(*task_shard, partition_name, number_of_splits)); - task_shard->checked_partitions.emplace(partition_name, true); - - auto shard_partition_it = task_shard->partition_tasks.find(partition_name); - PartitionPieces & shard_partition_pieces = shard_partition_it->second.pieces; - - for (size_t piece_number = 0; piece_number < number_of_splits; ++piece_number) - { - bool res = checkPresentPartitionPiecesOnCurrentShard(timeouts, *task_shard, partition_name, piece_number); - shard_partition_pieces.emplace_back(shard_partition_it->second, piece_number, res); - } - } - - if (!missing_partitions.empty()) - { - WriteBufferFromOwnString ss; - for (const String & missing_partition : missing_partitions) - ss << " " << missing_partition; - - LOG_WARNING(log, "There are no {} partitions from enabled_partitions in shard {} :{}", missing_partitions.size(), task_shard->getDescription(), ss.str()); - } - - LOG_INFO(log, "Will copy {} 
partitions from shard {}", task_shard->partition_tasks.size(), task_shard->getDescription()); -} - -void ClusterCopier::discoverTablePartitions(const ConnectionTimeouts & timeouts, TaskTable & task_table, UInt64 num_threads) -{ - /// Fetch partitions list from a shard - { - ThreadPool thread_pool(CurrentMetrics::LocalThread, CurrentMetrics::LocalThreadActive, CurrentMetrics::LocalThreadScheduled, num_threads ? num_threads : 2 * getNumberOfPhysicalCPUCores()); - - for (const TaskShardPtr & task_shard : task_table.all_shards) - thread_pool.scheduleOrThrowOnError([this, timeouts, task_shard]() - { - setThreadName("DiscoverPartns"); - discoverShardPartitions(timeouts, task_shard); - }); - - LOG_INFO(log, "Waiting for {} setup jobs", thread_pool.active()); - thread_pool.wait(); - } -} - -void ClusterCopier::uploadTaskDescription(const std::string & task_path, const std::string & task_file, const bool force) -{ - auto local_task_description_path = task_path + "/description"; - - String task_config_str; - { - ReadBufferFromFile in(task_file); - readStringUntilEOF(task_config_str, in); - } - if (task_config_str.empty()) - return; - - auto zookeeper = getContext()->getZooKeeper(); - - zookeeper->createAncestors(local_task_description_path); - auto code = zookeeper->tryCreate(local_task_description_path, task_config_str, zkutil::CreateMode::Persistent); - if (code != Coordination::Error::ZOK && force) - zookeeper->createOrUpdate(local_task_description_path, task_config_str, zkutil::CreateMode::Persistent); - - LOG_INFO(log, "Task description {} uploaded to {} with result {} ({})", - ((code != Coordination::Error::ZOK && !force) ? "not " : ""), local_task_description_path, code, Coordination::errorMessage(code)); -} - -void ClusterCopier::reloadTaskDescription() -{ - auto zookeeper = getContext()->getZooKeeper(); - task_description_watch_zookeeper = zookeeper; - - Coordination::Stat stat{}; - - /// It will throw exception if such a node doesn't exist. 
- auto task_config_str = zookeeper->get(task_description_path, &stat); - - LOG_INFO(log, "Loading task description"); - task_cluster_current_config = getConfigurationFromXMLString(task_config_str); - - /// Setup settings - task_cluster->reloadSettings(*task_cluster_current_config); - getContext()->setSettings(task_cluster->settings_common); -} - -void ClusterCopier::updateConfigIfNeeded() -{ - UInt64 version_to_update = task_description_version; - bool is_outdated_version = task_description_current_version != version_to_update; - bool is_expired_session = !task_description_watch_zookeeper || task_description_watch_zookeeper->expired(); - - if (!is_outdated_version && !is_expired_session) - return; - - LOG_INFO(log, "Updating task description"); - reloadTaskDescription(); - - task_description_current_version = version_to_update; -} - -void ClusterCopier::process(const ConnectionTimeouts & timeouts) -{ - for (TaskTable & task_table : task_cluster->table_tasks) - { - LOG_INFO(log, "Process table task {} with {} shards, {} of them are local ones", task_table.table_id, task_table.all_shards.size(), task_table.local_shards.size()); - - if (task_table.all_shards.empty()) - continue; - - /// Discover partitions of each shard and total set of partitions - if (!task_table.has_enabled_partitions) - { - /// If there are no specified enabled_partitions, we must discover them manually - discoverTablePartitions(timeouts, task_table); - - /// After partitions of each shard are initialized, initialize cluster partitions - for (const TaskShardPtr & task_shard : task_table.all_shards) - { - for (const auto & partition_elem : task_shard->partition_tasks) - { - const String & partition_name = partition_elem.first; - task_table.cluster_partitions.emplace(partition_name, ClusterPartition{}); - } - } - - for (auto & partition_elem : task_table.cluster_partitions) - { - const String & partition_name = partition_elem.first; - - for (const TaskShardPtr & task_shard : task_table.all_shards) - task_shard->checked_partitions.emplace(partition_name); - - task_table.ordered_partition_names.emplace_back(partition_name); - } - } - else - { - /// If enabled_partitions are specified, assume that each shard has all partitions - /// We will refine partition set of each shard in future - - for (const String & partition_name : task_table.enabled_partitions) - { - task_table.cluster_partitions.emplace(partition_name, ClusterPartition{}); - task_table.ordered_partition_names.emplace_back(partition_name); - } - } - - task_table.watch.restart(); - - /// Retry table processing - bool table_is_done = false; - for (UInt64 num_table_tries = 1; num_table_tries <= max_table_tries; ++num_table_tries) - { - if (tryProcessTable(timeouts, task_table)) - { - table_is_done = true; - break; - } - } - - if (!table_is_done) - { - throw Exception(ErrorCodes::UNFINISHED, "Too many tries to process table {}. Abort remaining execution", - task_table.table_id); - } - } -} - -/// Protected section - - -/* - * Creates task worker node and checks maximum number of workers not to exceed the limit. - * To achieve this we have to check version of workers_version_path node and create current_worker_path - * node atomically. 
- * */ - -zkutil::EphemeralNodeHolder::Ptr ClusterCopier::createTaskWorkerNodeAndWaitIfNeed( - const zkutil::ZooKeeperPtr & zookeeper, - const String & description, - bool unprioritized) -{ - std::chrono::milliseconds current_sleep_time = retry_delay_ms; - static constexpr std::chrono::milliseconds max_sleep_time(30000); // 30 sec - - if (unprioritized) - std::this_thread::sleep_for(current_sleep_time); - - String workers_version_path = getWorkersPathVersion(); - String workers_path = getWorkersPath(); - String current_worker_path = getCurrentWorkerNodePath(); - - UInt64 num_bad_version_errors = 0; - - while (true) - { - updateConfigIfNeeded(); - - Coordination::Stat stat; - zookeeper->get(workers_version_path, &stat); - auto version = stat.version; - zookeeper->get(workers_path, &stat); - - if (static_cast(stat.numChildren) >= task_cluster->max_workers) - { - LOG_INFO(log, "Too many workers ({}, maximum {}). Postpone processing {}", stat.numChildren, task_cluster->max_workers, description); - - if (unprioritized) - current_sleep_time = std::min(max_sleep_time, current_sleep_time + retry_delay_ms); - - std::this_thread::sleep_for(current_sleep_time); - num_bad_version_errors = 0; - } - else - { - Coordination::Requests ops; - ops.emplace_back(zkutil::makeSetRequest(workers_version_path, description, version)); - ops.emplace_back(zkutil::makeCreateRequest(current_worker_path, description, zkutil::CreateMode::Ephemeral)); - Coordination::Responses responses; - auto code = zookeeper->tryMulti(ops, responses); - - if (code == Coordination::Error::ZOK || code == Coordination::Error::ZNODEEXISTS) - return zkutil::EphemeralNodeHolder::existing(current_worker_path, *zookeeper); - - if (code == Coordination::Error::ZBADVERSION) - { - ++num_bad_version_errors; - - /// Try to make fast retries - if (num_bad_version_errors > 3) - { - LOG_INFO(log, "A concurrent worker has just been added, will check free worker slots again"); - std::chrono::milliseconds random_sleep_time(std::uniform_int_distribution(1, 1000)(task_cluster->random_engine)); - std::this_thread::sleep_for(random_sleep_time); - num_bad_version_errors = 0; - } - } - else - throw Coordination::Exception(code); - } - } -} - - -bool ClusterCopier::checkPartitionPieceIsClean( - const zkutil::ZooKeeperPtr & zookeeper, - const CleanStateClock & clean_state_clock, - const String & task_status_path) -{ - LogicalClock task_start_clock; - - Coordination::Stat stat{}; - if (zookeeper->exists(task_status_path, &stat)) - task_start_clock = LogicalClock(stat.mzxid); - - return clean_state_clock.is_clean() && (!task_start_clock.hasHappened() || clean_state_clock.discovery_zxid <= task_start_clock); -} - - -bool ClusterCopier::checkAllPiecesInPartitionAreDone(const TaskTable & task_table, const String & partition_name, const TasksShard & shards_with_partition) -{ - bool answer = true; - for (size_t piece_number = 0; piece_number < task_table.number_of_splits; ++piece_number) - { - bool piece_is_done = checkPartitionPieceIsDone(task_table, partition_name, piece_number, shards_with_partition); - if (!piece_is_done) - LOG_INFO(log, "Partition {} piece {} is not already done.", partition_name, piece_number); - answer &= piece_is_done; - } - - return answer; -} - - -/* The same as function above - * Assume that we don't know on which shards do we have partition certain piece. - * We'll check them all (I mean shards that contain the whole partition) - * And shards that don't have certain piece MUST mark that piece is_done true. 
- * */ -bool ClusterCopier::checkPartitionPieceIsDone(const TaskTable & task_table, const String & partition_name, - size_t piece_number, const TasksShard & shards_with_partition) -{ - LOG_INFO(log, "Check that all shards processed partition {} piece {} successfully", partition_name, piece_number); - - auto zookeeper = getContext()->getZooKeeper(); - - /// Collect all shards that contain partition piece number piece_number. - Strings piece_status_paths; - for (const auto & shard : shards_with_partition) - { - ShardPartition & task_shard_partition = shard->partition_tasks.find(partition_name)->second; - ShardPartitionPiece & shard_partition_piece = task_shard_partition.pieces[piece_number]; - piece_status_paths.emplace_back(shard_partition_piece.getShardStatusPath()); - } - - std::vector zxid1, zxid2; - - try - { - std::vector get_futures; - for (const String & path : piece_status_paths) - get_futures.emplace_back(zookeeper->asyncGet(path)); - - // Check that state is Finished and remember zxid - for (auto & future : get_futures) - { - auto res = future.get(); - - TaskStateWithOwner status = TaskStateWithOwner::fromString(res.data); - if (status.state != TaskState::Finished) - { - LOG_INFO(log, "The task {} is being rewritten by {}. Partition piece will be rechecked", res.data, status.owner); - return false; - } - - zxid1.push_back(res.stat.pzxid); - } - - const String piece_is_dirty_flag_path = task_table.getCertainPartitionPieceIsDirtyPath(partition_name, piece_number); - const String piece_is_dirty_cleaned_path = task_table.getCertainPartitionPieceIsCleanedPath(partition_name, piece_number); - const String piece_task_status_path = task_table.getCertainPartitionPieceTaskStatusPath(partition_name, piece_number); - - CleanStateClock clean_state_clock (zookeeper, piece_is_dirty_flag_path, piece_is_dirty_cleaned_path); - - const bool is_clean = checkPartitionPieceIsClean(zookeeper, clean_state_clock, piece_task_status_path); - - - if (!is_clean) - { - LOG_INFO(log, "Partition {} become dirty", partition_name); - return false; - } - - get_futures.clear(); - for (const String & path : piece_status_paths) - get_futures.emplace_back(zookeeper->asyncGet(path)); - - // Remember zxid of states again - for (auto & future : get_futures) - { - auto res = future.get(); - zxid2.push_back(res.stat.pzxid); - } - } - catch (const Coordination::Exception & e) - { - LOG_INFO(log, "A ZooKeeper error occurred while checking partition {} piece number {}. Will recheck the partition. Error: {}", partition_name, toString(piece_number), e.displayText()); - return false; - } - - // If all task is finished and zxid is not changed then partition could not become dirty again - for (UInt64 shard_num = 0; shard_num < piece_status_paths.size(); ++shard_num) - { - if (zxid1[shard_num] != zxid2[shard_num]) - { - LOG_INFO(log, "The task {} is being modified now. 
Partition piece will be rechecked", piece_status_paths[shard_num]); - return false; - } - } - - LOG_INFO(log, "Partition {} piece number {} is copied successfully", partition_name, toString(piece_number)); - return true; -} - - -TaskStatus ClusterCopier::tryMoveAllPiecesToDestinationTable(const TaskTable & task_table, const String & partition_name) -{ - bool inject_fault = false; - if (move_fault_probability > 0) - { - double value = std::uniform_real_distribution<>(0, 1)(task_table.task_cluster.random_engine); - inject_fault = value < move_fault_probability; - } - - LOG_INFO(log, "Try to move {} to destination table", partition_name); - - auto zookeeper = getContext()->getZooKeeper(); - - const auto current_partition_attach_is_active = task_table.getPartitionAttachIsActivePath(partition_name); - const auto current_partition_attach_is_done = task_table.getPartitionAttachIsDonePath(partition_name); - - /// Create ephemeral node to mark that we are active and process the partition - zookeeper->createAncestors(current_partition_attach_is_active); - zkutil::EphemeralNodeHolderPtr partition_attach_node_holder; - try - { - partition_attach_node_holder = zkutil::EphemeralNodeHolder::create(current_partition_attach_is_active, *zookeeper, host_id); - } - catch (const Coordination::Exception & e) - { - if (e.code == Coordination::Error::ZNODEEXISTS) - { - LOG_INFO(log, "Someone is already moving pieces {}", current_partition_attach_is_active); - return TaskStatus::Active; - } - - throw; - } - - - /// Exit if task has been already processed; - /// create blocking node to signal cleaning up if it is abandoned - { - String status_data; - if (zookeeper->tryGet(current_partition_attach_is_done, status_data)) - { - TaskStateWithOwner status = TaskStateWithOwner::fromString(status_data); - if (status.state == TaskState::Finished) - { - LOG_INFO(log, "All pieces for partition from this task {} has been successfully moved to destination table by {}", current_partition_attach_is_active, status.owner); - return TaskStatus::Finished; - } - - /// Task is abandoned, because previously we created ephemeral node, possibly in other copier's process. - /// Initialize DROP PARTITION - LOG_INFO(log, "Moving piece for partition {} has not been successfully finished by {}. Will try to move by myself.", current_partition_attach_is_active, status.owner); - - /// Remove is_done marker. - zookeeper->remove(current_partition_attach_is_done); - } - } - - - /// Try start processing, create node about it - { - String start_state = TaskStateWithOwner::getData(TaskState::Started, host_id); - zookeeper->create(current_partition_attach_is_done, start_state, zkutil::CreateMode::Persistent); - } - - - /// Try to drop destination partition in original table - if (task_table.allow_to_drop_target_partitions) - { - DatabaseAndTableName original_table = task_table.table_push; - - WriteBufferFromOwnString ss; - ss << "ALTER TABLE " << getQuotedTable(original_table) << ((partition_name == "'all'") ? 
" DROP PARTITION ID " : " DROP PARTITION ") << partition_name; - - UInt64 num_shards_drop_partition = executeQueryOnCluster(task_table.cluster_push, ss.str(), task_cluster->settings_push, ClusterExecutionMode::ON_EACH_SHARD); - if (num_shards_drop_partition != task_table.cluster_push->getShardCount()) - return TaskStatus::Error; - - LOG_INFO(log, "Drop partition {} in original table {} have been executed successfully on {} shards of {}", - partition_name, getQuotedTable(original_table), num_shards_drop_partition, task_table.cluster_push->getShardCount()); - } - - /// Move partition to original destination table. - for (size_t current_piece_number = 0; current_piece_number < task_table.number_of_splits; ++current_piece_number) - { - LOG_INFO(log, "Trying to move partition {} piece {} to original table", partition_name, toString(current_piece_number)); - - ASTPtr query_alter_ast; - String query_alter_ast_string; - - DatabaseAndTableName original_table = task_table.table_push; - DatabaseAndTableName helping_table = DatabaseAndTableName(original_table.first, - original_table.second + "_piece_" + - toString(current_piece_number)); - - Settings settings_push = task_cluster->settings_push; - ClusterExecutionMode execution_mode = ClusterExecutionMode::ON_EACH_NODE; - - if (settings_push.alter_sync == 1) - execution_mode = ClusterExecutionMode::ON_EACH_SHARD; - - query_alter_ast_string += " ALTER TABLE " + getQuotedTable(original_table) + - ((partition_name == "'all'") ? " ATTACH PARTITION ID " : " ATTACH PARTITION ") + partition_name + - " FROM " + getQuotedTable(helping_table); - - LOG_INFO(log, "Executing ALTER query: {}", query_alter_ast_string); - - try - { - /// Try attach partition on each shard - UInt64 num_nodes = executeQueryOnCluster( - task_table.cluster_push, - query_alter_ast_string, - task_cluster->settings_push, - execution_mode); - - if (settings_push.alter_sync == 1) - { - LOG_INFO( - log, - "Destination tables {} have been executed alter query successfully on {} shards of {}", - getQuotedTable(task_table.table_push), - num_nodes, - task_table.cluster_push->getShardCount()); - - if (num_nodes != task_table.cluster_push->getShardCount()) - return TaskStatus::Error; - } - else - { - LOG_INFO(log, "Number of nodes that executed ALTER query successfully : {}", toString(num_nodes)); - } - } - catch (...) - { - LOG_INFO(log, "Error while moving partition {} piece {} to original table", partition_name, toString(current_piece_number)); - LOG_WARNING(log, "In case of non-replicated tables it can cause duplicates."); - throw; - } - - if (inject_fault) - throw Exception(ErrorCodes::UNFINISHED, "Copy fault injection is activated"); - } - - /// Create node to signal that we finished moving - /// Also increment a counter of processed partitions - { - const auto state_finished = TaskStateWithOwner::getData(TaskState::Finished, host_id); - const auto task_status = task_zookeeper_path + "/status"; - - /// Try until success - while (true) - { - Coordination::Stat stat; - auto status_json = zookeeper->get(task_status, &stat); - auto statuses = StatusAccumulator::fromJSON(status_json); - - /// Increment status for table. 
- (*statuses)[task_table.name_in_config].processed_partitions_count += 1; - auto statuses_to_commit = StatusAccumulator::serializeToJSON(statuses); - - Coordination::Requests ops; - ops.emplace_back(zkutil::makeSetRequest(current_partition_attach_is_done, state_finished, 0)); - ops.emplace_back(zkutil::makeSetRequest(task_status, statuses_to_commit, stat.version)); - - Coordination::Responses responses; - Coordination::Error code = zookeeper->tryMulti(ops, responses); - - if (code == Coordination::Error::ZOK) - break; - } - } - - return TaskStatus::Finished; -} - -/// This is needed to create internal Distributed table -/// Removes column's TTL expression from `CREATE` query -/// Removes MATEREALIZED or ALIAS columns not to copy additional and useless data over the network. -/// Removes data skipping indices. -ASTPtr ClusterCopier::removeAliasMaterializedAndTTLColumnsFromCreateQuery(const ASTPtr & query_ast, bool allow_to_copy_alias_and_materialized_columns) -{ - const ASTs & column_asts = query_ast->as().columns_list->columns->children; - auto new_columns = std::make_shared(); - - for (const ASTPtr & column_ast : column_asts) - { - const auto & column = column_ast->as(); - - /// Skip this columns - if (!column.default_specifier.empty() && !allow_to_copy_alias_and_materialized_columns) - { - ColumnDefaultKind kind = columnDefaultKindFromString(column.default_specifier); - if (kind == ColumnDefaultKind::Materialized || kind == ColumnDefaultKind::Alias) - continue; - } - - /// Remove TTL on columns definition. - auto new_column_ast = column_ast->clone(); - auto & new_column = new_column_ast->as(); - if (new_column.ttl) - new_column.ttl.reset(); - - new_columns->children.emplace_back(new_column_ast); - } - - ASTPtr new_query_ast = query_ast->clone(); - auto & new_query = new_query_ast->as(); - - auto new_columns_list = std::make_shared(); - new_columns_list->set(new_columns_list->columns, new_columns); - - /// Skip indices and projections are not needed, because distributed table doesn't support it. 
- - new_query.replace(new_query.columns_list, new_columns_list); - - return new_query_ast; -} - -/// Replaces ENGINE and table name in a create query -std::shared_ptr rewriteCreateQueryStorage(const ASTPtr & create_query_ast, - const DatabaseAndTableName & new_table, - const ASTPtr & new_storage_ast) -{ - const auto & create = create_query_ast->as(); - auto res = std::make_shared(create); - - if (create.storage == nullptr || new_storage_ast == nullptr) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Storage is not specified"); - - res->setDatabase(new_table.first); - res->setTable(new_table.second); - - res->children.clear(); - res->set(res->columns_list, create.columns_list->clone()); - res->set(res->storage, new_storage_ast->clone()); - /// Just to make it better and don't store additional flag like `is_table_created` somewhere else - res->if_not_exists = true; - - return res; -} - - -bool ClusterCopier::tryDropPartitionPiece( - ShardPartition & task_partition, - const size_t current_piece_number, - const zkutil::ZooKeeperPtr & zookeeper, - const CleanStateClock & clean_state_clock) -{ - if (is_safe_mode) - throw Exception(ErrorCodes::NOT_IMPLEMENTED, "DROP PARTITION is prohibited in safe mode"); - - TaskTable & task_table = task_partition.task_shard.task_table; - ShardPartitionPiece & partition_piece = task_partition.pieces[current_piece_number]; - - const String current_shards_path = partition_piece.getPartitionPieceShardsPath(); - const String current_partition_active_workers_dir = partition_piece.getPartitionPieceActiveWorkersPath(); - const String is_dirty_flag_path = partition_piece.getPartitionPieceIsDirtyPath(); - const String dirty_cleaner_path = partition_piece.getPartitionPieceCleanerPath(); - const String is_dirty_cleaned_path = partition_piece.getPartitionPieceIsCleanedPath(); - - zkutil::EphemeralNodeHolder::Ptr cleaner_holder; - try - { - cleaner_holder = zkutil::EphemeralNodeHolder::create(dirty_cleaner_path, *zookeeper, host_id); - } - catch (const Coordination::Exception & e) - { - if (e.code == Coordination::Error::ZNODEEXISTS) - { - LOG_INFO(log, "Partition {} piece {} is cleaning now by somebody, sleep", task_partition.name, toString(current_piece_number)); - std::this_thread::sleep_for(retry_delay_ms); - return false; - } - - throw; - } - - Coordination::Stat stat{}; - if (zookeeper->exists(current_partition_active_workers_dir, &stat)) - { - if (stat.numChildren != 0) - { - LOG_INFO(log, "Partition {} contains {} active workers while trying to drop it. 
Going to sleep.", task_partition.name, stat.numChildren); - std::this_thread::sleep_for(retry_delay_ms); - return false; - } - else - { - zookeeper->remove(current_partition_active_workers_dir); - } - } - - { - zkutil::EphemeralNodeHolder::Ptr active_workers_lock; - try - { - active_workers_lock = zkutil::EphemeralNodeHolder::create(current_partition_active_workers_dir, *zookeeper, host_id); - } - catch (const Coordination::Exception & e) - { - if (e.code == Coordination::Error::ZNODEEXISTS) - { - LOG_INFO(log, "Partition {} is being filled now by somebody, sleep", task_partition.name); - return false; - } - - throw; - } - - // Lock the dirty flag - zookeeper->set(is_dirty_flag_path, host_id, clean_state_clock.discovery_version.value()); - zookeeper->tryRemove(partition_piece.getPartitionPieceCleanStartPath()); - CleanStateClock my_clock(zookeeper, is_dirty_flag_path, is_dirty_cleaned_path); - - /// Remove all status nodes - { - Strings children; - if (zookeeper->tryGetChildren(current_shards_path, children) == Coordination::Error::ZOK) - for (const auto & child : children) - { - zookeeper->removeRecursive(current_shards_path + "/" + child); - } - } - - - DatabaseAndTableName original_table = task_table.table_push; - DatabaseAndTableName helping_table = DatabaseAndTableName(original_table.first, original_table.second + "_piece_" + toString(current_piece_number)); - - String query = "ALTER TABLE " + getQuotedTable(helping_table); - query += ((task_partition.name == "'all'") ? " DROP PARTITION ID " : " DROP PARTITION ") + task_partition.name + ""; - - /// TODO: use this statement after servers will be updated up to 1.1.54310 - // query += " DROP PARTITION ID '" + task_partition.name + "'"; - - ClusterPtr & cluster_push = task_table.cluster_push; - Settings settings_push = task_cluster->settings_push; - - /// It is important, DROP PARTITION must be done synchronously - settings_push.alter_sync = 2; - - LOG_INFO(log, "Execute distributed DROP PARTITION: {}", query); - /// We have to drop partition_piece on each replica - size_t num_shards = executeQueryOnCluster( - cluster_push, query, - settings_push, - ClusterExecutionMode::ON_EACH_NODE); - - LOG_INFO(log, "DROP PARTITION was successfully executed on {} nodes of a cluster.", num_shards); - - /// Update the locking node - if (!my_clock.is_stale()) - { - zookeeper->set(is_dirty_flag_path, host_id, my_clock.discovery_version.value()); - if (my_clock.clean_state_version) - zookeeper->set(is_dirty_cleaned_path, host_id, my_clock.clean_state_version.value()); - else - zookeeper->create(is_dirty_cleaned_path, host_id, zkutil::CreateMode::Persistent); - } - else - { - LOG_INFO(log, "Clean state is altered when dropping the partition, cowardly bailing"); - /// clean state is stale - return false; - } - - LOG_INFO(log, "Partition {} piece {} was dropped on cluster {}", task_partition.name, toString(current_piece_number), task_table.cluster_push_name); - if (zookeeper->tryCreate(current_shards_path, host_id, zkutil::CreateMode::Persistent) == Coordination::Error::ZNODEEXISTS) - zookeeper->set(current_shards_path, host_id); - } - - LOG_INFO(log, "Partition {} piece {} is safe for work now.", task_partition.name, toString(current_piece_number)); - return true; -} - -bool ClusterCopier::tryProcessTable(const ConnectionTimeouts & timeouts, TaskTable & task_table) -{ - /// Create destination table - TaskStatus task_status = TaskStatus::Error; - - task_status = tryCreateDestinationTable(timeouts, task_table); - /// Exit if success - if (task_status != 
TaskStatus::Finished) - { - LOG_WARNING(log, "Create destination table failed "); - return false; - } - - /// Set all_partitions_count for table in Zookeeper - auto zookeeper = getContext()->getZooKeeper(); - while (true) - { - Coordination::Stat stat; - auto status_json = zookeeper->get(task_zookeeper_path + "/status", &stat); - auto statuses = StatusAccumulator::fromJSON(status_json); - - /// Exit if someone already set the initial value for this table. - if (statuses->find(task_table.name_in_config) != statuses->end()) - break; - (*statuses)[task_table.name_in_config] = StatusAccumulator::TableStatus - { - /*all_partitions_count=*/task_table.ordered_partition_names.size(), - /*processed_partition_count=*/0 - }; - - auto statuses_to_commit = StatusAccumulator::serializeToJSON(statuses); - auto error = zookeeper->trySet(task_zookeeper_path + "/status", statuses_to_commit, stat.version); - if (error == Coordination::Error::ZOK) - break; - } - - - /// An heuristic: if previous shard is already done, then check next one without sleeps due to max_workers constraint - bool previous_shard_is_instantly_finished = false; - - /// Process each partition that is present in cluster - for (const String & partition_name : task_table.ordered_partition_names) - { - if (!task_table.cluster_partitions.contains(partition_name)) - throw Exception(ErrorCodes::LOGICAL_ERROR, "There are no expected partition {}. It is a bug", partition_name); - - ClusterPartition & cluster_partition = task_table.cluster_partitions[partition_name]; - - Stopwatch watch; - /// We will check all the shards of the table and check if they contain current partition. - TasksShard expected_shards; - UInt64 num_failed_shards = 0; - - ++cluster_partition.total_tries; - - LOG_INFO(log, "Processing partition {} for the whole cluster", partition_name); - - /// Process each source shard having current partition and copy current partition - /// NOTE: shards are sorted by "distance" to current host - bool has_shard_to_process = false; - for (const TaskShardPtr & shard : task_table.all_shards) - { - /// Does shard have a node with current partition? - if (!shard->partition_tasks.contains(partition_name)) - { - /// If not, did we check existence of that partition previously? - if (!shard->checked_partitions.contains(partition_name)) - { - auto check_shard_has_partition = [&] () { return checkShardHasPartition(timeouts, *shard, partition_name); }; - bool has_partition = retry(check_shard_has_partition); - - shard->checked_partitions.emplace(partition_name); - - if (has_partition) - { - const size_t number_of_splits = task_table.number_of_splits; - shard->partition_tasks.emplace(partition_name, ShardPartition(*shard, partition_name, number_of_splits)); - LOG_INFO(log, "Discovered partition {} in shard {}", partition_name, shard->getDescription()); - /// To save references in the future. 
- auto shard_partition_it = shard->partition_tasks.find(partition_name); - PartitionPieces & shard_partition_pieces = shard_partition_it->second.pieces; - - for (size_t piece_number = 0; piece_number < number_of_splits; ++piece_number) - { - auto res = checkPresentPartitionPiecesOnCurrentShard(timeouts, *shard, partition_name, piece_number); - shard_partition_pieces.emplace_back(shard_partition_it->second, piece_number, res); - } - } - else - { - LOG_INFO(log, "Found that shard {} does not contain current partition {}", shard->getDescription(), partition_name); - continue; - } - } - else - { - /// We have already checked that partition, but did not discover it - previous_shard_is_instantly_finished = true; - continue; - } - } - - auto it_shard_partition = shard->partition_tasks.find(partition_name); - /// Previously when we discovered that shard does not contain current partition, we skipped it. - /// At this moment partition have to be present. - if (it_shard_partition == shard->partition_tasks.end()) - throw Exception(ErrorCodes::LOGICAL_ERROR, "There are no such partition in a shard. This is a bug."); - auto & partition = it_shard_partition->second; - - expected_shards.emplace_back(shard); - - /// Do not sleep if there is a sequence of already processed shards to increase startup - bool is_unprioritized_task = !previous_shard_is_instantly_finished && shard->priority.is_remote; - task_status = TaskStatus::Error; - bool was_error = false; - has_shard_to_process = true; - for (UInt64 try_num = 1; try_num <= max_shard_partition_tries; ++try_num) - { - task_status = tryProcessPartitionTask(timeouts, partition, is_unprioritized_task); - - /// Exit if success - if (task_status == TaskStatus::Finished) - break; - - was_error = true; - - /// Skip if the task is being processed by someone - if (task_status == TaskStatus::Active) - break; - - /// Repeat on errors - std::this_thread::sleep_for(retry_delay_ms); - } - - if (task_status == TaskStatus::Error) - ++num_failed_shards; - - previous_shard_is_instantly_finished = !was_error; - } - - cluster_partition.elapsed_time_seconds += watch.elapsedSeconds(); - - /// Check that whole cluster partition is done - /// Firstly check the number of failed partition tasks, then look into ZooKeeper and ensure that each partition is done - bool partition_copying_is_done = num_failed_shards == 0; - try - { - partition_copying_is_done = - !has_shard_to_process - || (partition_copying_is_done && checkAllPiecesInPartitionAreDone(task_table, partition_name, expected_shards)); - } - catch (...) - { - tryLogCurrentException(log); - partition_copying_is_done = false; - } - - - bool partition_moving_is_done = false; - /// Try to move only if all pieces were copied. - if (partition_copying_is_done) - { - for (UInt64 try_num = 0; try_num < max_shard_partition_piece_tries_for_alter; ++try_num) - { - try - { - auto res = tryMoveAllPiecesToDestinationTable(task_table, partition_name); - /// Exit and mark current task is done. - if (res == TaskStatus::Finished) - { - partition_moving_is_done = true; - break; - } - - /// Exit if this task is active. - if (res == TaskStatus::Active) - break; - - /// Repeat on errors. - std::this_thread::sleep_for(retry_delay_ms); - } - catch (...) 
- { - tryLogCurrentException(log, "Some error occurred while moving pieces to destination table for partition " + partition_name); - } - } - } - - if (partition_copying_is_done && partition_moving_is_done) - { - task_table.finished_cluster_partitions.emplace(partition_name); - - task_table.bytes_copied += cluster_partition.bytes_copied; - task_table.rows_copied += cluster_partition.rows_copied; - double elapsed = cluster_partition.elapsed_time_seconds; - - LOG_INFO(log, "It took {} seconds to copy partition {}: {} uncompressed bytes, {} rows and {} source blocks are copied", - elapsed, partition_name, - formatReadableSizeWithDecimalSuffix(cluster_partition.bytes_copied), - formatReadableQuantity(cluster_partition.rows_copied), - cluster_partition.blocks_copied); - - if (cluster_partition.rows_copied) - { - LOG_INFO(log, "Average partition speed: {} per second.", formatReadableSizeWithDecimalSuffix(cluster_partition.bytes_copied / elapsed)); - } - - if (task_table.rows_copied) - { - LOG_INFO(log, "Average table {} speed: {} per second.", task_table.table_id, formatReadableSizeWithDecimalSuffix(task_table.bytes_copied / elapsed)); - } - } - } - - UInt64 required_partitions = task_table.cluster_partitions.size(); - UInt64 finished_partitions = task_table.finished_cluster_partitions.size(); - bool table_is_done = finished_partitions >= required_partitions; - - if (!table_is_done) - { - LOG_INFO(log, "Table {} is not processed yet. Copied {} of {}, will retry", task_table.table_id, finished_partitions, required_partitions); - } - else - { - /// Delete helping tables in case that whole table is done - dropHelpingTables(task_table); - } - - return table_is_done; -} - -TaskStatus ClusterCopier::tryCreateDestinationTable(const ConnectionTimeouts & timeouts, TaskTable & task_table) -{ - /// Try create original table (if not exists) on each shard - - //TaskTable & task_table = task_shard.task_table; - const TaskShardPtr task_shard = task_table.all_shards.at(0); - /// We need to update table definitions for each part, it could be changed after ALTER - task_shard->current_pull_table_create_query = getCreateTableForPullShard(timeouts, *task_shard); - try - { - auto create_query_push_ast - = rewriteCreateQueryStorage(task_shard->current_pull_table_create_query, task_table.table_push, task_table.engine_push_ast); - auto & create = create_query_push_ast->as(); - create.if_not_exists = true; - InterpreterCreateQuery::prepareOnClusterQuery(create, getContext(), task_table.cluster_push_name); - String query = queryToString(create_query_push_ast); - - LOG_INFO(log, "Create destination tables. Query: {}", query); - UInt64 shards = executeQueryOnCluster(task_table.cluster_push, query, task_cluster->settings_push, ClusterExecutionMode::ON_EACH_NODE); - LOG_INFO( - log, - "Destination tables {} have been created on {} shards of {}", - getQuotedTable(task_table.table_push), - shards, - task_table.cluster_push->getShardCount()); - } - catch (...) - { - tryLogCurrentException(log, "Error while creating original table. Maybe we are not first."); - } - - return TaskStatus::Finished; -} - -/// Job for copying partition from particular shard. -TaskStatus ClusterCopier::tryProcessPartitionTask(const ConnectionTimeouts & timeouts, ShardPartition & task_partition, bool is_unprioritized_task) -{ - TaskStatus res; - - try - { - res = iterateThroughAllPiecesInPartition(timeouts, task_partition, is_unprioritized_task); - } - catch (...) 
- { - tryLogCurrentException(log, "An error occurred while processing partition " + task_partition.name); - res = TaskStatus::Error; - } - - /// At the end of each task check if the config is updated - try - { - updateConfigIfNeeded(); - } - catch (...) - { - tryLogCurrentException(log, "An error occurred while updating the config"); - } - - return res; -} - -TaskStatus ClusterCopier::iterateThroughAllPiecesInPartition(const ConnectionTimeouts & timeouts, ShardPartition & task_partition, - bool is_unprioritized_task) -{ - const size_t total_number_of_pieces = task_partition.task_shard.task_table.number_of_splits; - - TaskStatus res{TaskStatus::Finished}; - - bool was_failed_pieces = false; - bool was_active_pieces = false; - - for (size_t piece_number = 0; piece_number < total_number_of_pieces; piece_number++) - { - for (UInt64 try_num = 0; try_num < max_shard_partition_tries; ++try_num) - { - LOG_INFO(log, "Attempt number {} to process partition {} piece number {} on shard number {} with index {}.", - try_num, task_partition.name, piece_number, - task_partition.task_shard.numberInCluster(), - task_partition.task_shard.indexInCluster()); - - res = processPartitionPieceTaskImpl(timeouts, task_partition, piece_number, is_unprioritized_task); - - /// Exit if success - if (res == TaskStatus::Finished) - break; - - /// Skip if the task is being processed by someone - if (res == TaskStatus::Active) - break; - - /// Repeat on errors - std::this_thread::sleep_for(retry_delay_ms); - } - - was_active_pieces |= (res == TaskStatus::Active); - was_failed_pieces |= (res == TaskStatus::Error); - } - - if (was_failed_pieces) - return TaskStatus::Error; - - if (was_active_pieces) - return TaskStatus::Active; - - return TaskStatus::Finished; -} - - -TaskStatus ClusterCopier::processPartitionPieceTaskImpl( - const ConnectionTimeouts & timeouts, ShardPartition & task_partition, - const size_t current_piece_number, bool is_unprioritized_task) -{ - TaskShard & task_shard = task_partition.task_shard; - TaskTable & task_table = task_shard.task_table; - ClusterPartition & cluster_partition = task_table.getClusterPartition(task_partition.name); - ShardPartitionPiece & partition_piece = task_partition.pieces[current_piece_number]; - - const size_t number_of_splits = task_table.number_of_splits; - const String primary_key_comma_separated = task_table.primary_key_comma_separated; - - /// We need to update table definitions for each partition, it could be changed after ALTER - createShardInternalTables(timeouts, task_shard, true); - - auto split_table_for_current_piece = task_shard.list_of_split_tables_on_shard[current_piece_number]; - - auto zookeeper = getContext()->getZooKeeper(); - - const String piece_is_dirty_flag_path = partition_piece.getPartitionPieceIsDirtyPath(); - const String piece_is_dirty_cleaned_path = partition_piece.getPartitionPieceIsCleanedPath(); - const String current_task_piece_is_active_path = partition_piece.getActiveWorkerPath(); - const String current_task_piece_status_path = partition_piece.getShardStatusPath(); - - /// Auxiliary functions: - - /// Creates is_dirty node to initialize DROP PARTITION - auto create_is_dirty_node = [&] (const CleanStateClock & clock) - { - if (clock.is_stale()) - LOG_INFO(log, "Clean state clock is stale while setting dirty flag, cowardly bailing"); - else if (!clock.is_clean()) - LOG_INFO(log, "Thank you, Captain Obvious"); - else if (clock.discovery_version) - { - LOG_INFO(log, "Updating clean state clock"); - zookeeper->set(piece_is_dirty_flag_path, host_id, 
clock.discovery_version.value()); - } - else - { - LOG_INFO(log, "Creating clean state clock"); - zookeeper->create(piece_is_dirty_flag_path, host_id, zkutil::CreateMode::Persistent); - } - }; - - /// Returns SELECT query filtering current partition and applying user filter - auto get_select_query = [&] (const DatabaseAndTableName & from_table, const String & fields, bool enable_splitting, String limit = "") - { - String query; - query += "WITH " + task_partition.name + " AS partition_key "; - query += "SELECT " + fields + " FROM " + getQuotedTable(from_table); - - if (enable_splitting && experimental_use_sample_offset) - query += " SAMPLE 1/" + toString(number_of_splits) + " OFFSET " + toString(current_piece_number) + "/" + toString(number_of_splits); - - /// TODO: Bad, it is better to rewrite with ASTLiteral(partition_key_field) - query += " WHERE (" + queryToString(task_table.engine_push_partition_key_ast) + " = partition_key)"; - - if (enable_splitting && !experimental_use_sample_offset) - query += " AND ( cityHash64(" + primary_key_comma_separated + ") %" + toString(number_of_splits) + " = " + toString(current_piece_number) + " )"; - - if (!task_table.where_condition_str.empty()) - query += " AND (" + task_table.where_condition_str + ")"; - - if (!limit.empty()) - query += " LIMIT " + limit; - - query += " FORMAT Native"; - - ParserQuery p_query(query.data() + query.size()); - - const auto & settings = getContext()->getSettingsRef(); - return parseQuery(p_query, query, settings.max_query_size, settings.max_parser_depth); - }; - - /// Load balancing - auto worker_node_holder = createTaskWorkerNodeAndWaitIfNeed(zookeeper, current_task_piece_status_path, is_unprioritized_task); - - LOG_INFO(log, "Processing {}", current_task_piece_status_path); - - const String piece_status_path = partition_piece.getPartitionPieceShardsPath(); - - CleanStateClock clean_state_clock(zookeeper, piece_is_dirty_flag_path, piece_is_dirty_cleaned_path); - - const bool is_clean = checkPartitionPieceIsClean(zookeeper, clean_state_clock, piece_status_path); - - /// Do not start if partition piece is dirty, try to clean it - if (is_clean) - { - LOG_INFO(log, "Partition {} piece {} appears to be clean", task_partition.name, current_piece_number); - zookeeper->createAncestors(current_task_piece_status_path); - } - else - { - LOG_INFO(log, "Partition {} piece {} is dirty, try to drop it", task_partition.name, current_piece_number); - - try - { - tryDropPartitionPiece(task_partition, current_piece_number, zookeeper, clean_state_clock); - } - catch (...) 
- { - tryLogCurrentException(log, "An error occurred when clean partition"); - } - - return TaskStatus::Error; - } - - /// Create ephemeral node to mark that we are active and process the partition - zookeeper->createAncestors(current_task_piece_is_active_path); - zkutil::EphemeralNodeHolderPtr partition_task_node_holder; - try - { - partition_task_node_holder = zkutil::EphemeralNodeHolder::create(current_task_piece_is_active_path, *zookeeper, host_id); - } - catch (const Coordination::Exception & e) - { - if (e.code == Coordination::Error::ZNODEEXISTS) - { - LOG_INFO(log, "Someone is already processing {}", current_task_piece_is_active_path); - return TaskStatus::Active; - } - - throw; - } - - /// Exit if task has been already processed; - /// create blocking node to signal cleaning up if it is abandoned - { - String status_data; - if (zookeeper->tryGet(current_task_piece_status_path, status_data)) - { - TaskStateWithOwner status = TaskStateWithOwner::fromString(status_data); - if (status.state == TaskState::Finished) - { - LOG_INFO(log, "Task {} has been successfully executed by {}", current_task_piece_status_path, status.owner); - return TaskStatus::Finished; - } - - /// Task is abandoned, because previously we created ephemeral node, possibly in other copier's process. - /// Initialize DROP PARTITION - LOG_INFO(log, "Task {} has not been successfully finished by {}. Partition will be dropped and refilled.", current_task_piece_status_path, status.owner); - - create_is_dirty_node(clean_state_clock); - return TaskStatus::Error; - } - } - - - /// Try create table (if not exists) on each shard - /// We have to create this table even in case that partition piece is empty - /// This is significant, because we will have simpler code - { - /// 1) Get columns description from any replica of destination cluster - /// 2) Change ENGINE, database and table name - /// 3) Create helping table on the whole destination cluster - auto & settings_push = task_cluster->settings_push; - - auto connection = task_table.cluster_push->getAnyShardInfo().pool->get(timeouts, settings_push, true); - String create_query = getRemoteCreateTable(task_shard.task_table.table_push, *connection, settings_push); - - ParserCreateQuery parser_create_query; - auto create_query_ast = parseQuery(parser_create_query, create_query, settings_push.max_query_size, settings_push.max_parser_depth); - /// Define helping table database and name for current partition piece - DatabaseAndTableName database_and_table_for_current_piece - { - task_table.table_push.first, - task_table.table_push.second + "_piece_" + toString(current_piece_number) - }; - - - auto new_engine_push_ast = task_table.engine_push_ast; - if (task_table.isReplicatedTable()) - new_engine_push_ast = task_table.rewriteReplicatedCreateQueryToPlain(); - - /// Take columns definition from destination table, new database and table name, and new engine (non replicated variant of MergeTree) - auto create_query_push_ast = rewriteCreateQueryStorage(create_query_ast, database_and_table_for_current_piece, new_engine_push_ast); - String query = queryToString(create_query_push_ast); - - LOG_INFO(log, "Create destination tables. 
Query: {}", query); - UInt64 shards = executeQueryOnCluster(task_table.cluster_push, query, task_cluster->settings_push, ClusterExecutionMode::ON_EACH_NODE); - LOG_INFO( - log, - "Destination tables {} have been created on {} shards of {}", - getQuotedTable(task_table.table_push), - shards, - task_table.cluster_push->getShardCount()); - } - - - /// Exit if current piece is absent on this shard. Also mark it as finished, because we will check - /// whether each shard have processed each partitition (and its pieces). - if (partition_piece.is_absent_piece) - { - String state_finished = TaskStateWithOwner::getData(TaskState::Finished, host_id); - auto res = zookeeper->tryCreate(current_task_piece_status_path, state_finished, zkutil::CreateMode::Persistent); - if (res == Coordination::Error::ZNODEEXISTS) - LOG_INFO(log, "Partition {} piece {} is absent on current replica of a shard. But other replicas have already marked it as done.", task_partition.name, current_piece_number); - if (res == Coordination::Error::ZOK) - LOG_INFO(log, "Partition {} piece {} is absent on current replica of a shard. Will mark it as done. Other replicas will do the same.", task_partition.name, current_piece_number); - return TaskStatus::Finished; - } - - /// Check that destination partition is empty if we are first worker - /// NOTE: this check is incorrect if pull and push tables have different partition key! - String clean_start_status; - if (!zookeeper->tryGet(partition_piece.getPartitionPieceCleanStartPath(), clean_start_status) || clean_start_status != "ok") - { - zookeeper->createIfNotExists(partition_piece.getPartitionPieceCleanStartPath(), ""); - auto checker = zkutil::EphemeralNodeHolder::create(partition_piece.getPartitionPieceCleanStartPath() + "/checker", - *zookeeper, host_id); - // Maybe we are the first worker - - ASTPtr query_select_ast = get_select_query(split_table_for_current_piece, "count()", /* enable_splitting= */ true); - UInt64 count; - { - auto local_context = Context::createCopy(context); - // Use pull (i.e. readonly) settings, but fetch data from destination servers - local_context->setSettings(task_cluster->settings_pull); - local_context->setSetting("skip_unavailable_shards", true); - - InterpreterSelectWithUnionQuery select(query_select_ast, local_context, SelectQueryOptions{}); - QueryPlan plan; - select.buildQueryPlan(plan); - auto builder = std::move(*plan.buildQueryPipeline( - QueryPlanOptimizationSettings::fromContext(local_context), - BuildQueryPipelineSettings::fromContext(local_context))); - - Block block = getBlockWithAllStreamData(std::move(builder)); - count = (block) ? block.safeGetByPosition(0).column->getUInt(0) : 0; - } - - if (count != 0) - { - LOG_INFO(log, "Partition {} piece {} is not empty. In contains {} rows.", task_partition.name, current_piece_number, count); - Coordination::Stat stat_shards{}; - zookeeper->get(partition_piece.getPartitionPieceShardsPath(), &stat_shards); - - /// NOTE: partition is still fresh if dirt discovery happens before cleaning - if (stat_shards.numChildren == 0) - { - LOG_WARNING(log, "There are no workers for partition {} piece {}, but destination table contains {} rows. 
Partition will be dropped and refilled.", task_partition.name, toString(current_piece_number), count); - - create_is_dirty_node(clean_state_clock); - return TaskStatus::Error; - } - } - zookeeper->set(partition_piece.getPartitionPieceCleanStartPath(), "ok"); - } - /// At this point, we need to sync that the destination table is clean - /// before any actual work - - /// Try start processing, create node about it - { - String start_state = TaskStateWithOwner::getData(TaskState::Started, host_id); - CleanStateClock new_clean_state_clock(zookeeper, piece_is_dirty_flag_path, piece_is_dirty_cleaned_path); - if (clean_state_clock != new_clean_state_clock) - { - LOG_INFO(log, "Partition {} piece {} clean state changed, cowardly bailing", task_partition.name, toString(current_piece_number)); - return TaskStatus::Error; - } - else if (!new_clean_state_clock.is_clean()) - { - LOG_INFO(log, "Partition {} piece {} is dirty and will be dropped and refilled", task_partition.name, toString(current_piece_number)); - create_is_dirty_node(new_clean_state_clock); - return TaskStatus::Error; - } - zookeeper->create(current_task_piece_status_path, start_state, zkutil::CreateMode::Persistent); - } - - - /// Do the copying - { - bool inject_fault = false; - if (copy_fault_probability > 0) - { - double value = std::uniform_real_distribution<>(0, 1)(task_table.task_cluster.random_engine); - inject_fault = value < copy_fault_probability; - } - - // Select all fields - ASTPtr query_select_ast = get_select_query(task_shard.table_read_shard, "*", /* enable_splitting= */ true, inject_fault ? "1" : ""); - - LOG_INFO(log, "Executing SELECT query and pull from {}: {}", task_shard.getDescription(), queryToString(query_select_ast)); - - ASTPtr query_insert_ast; - { - String query; - query += "INSERT INTO " + getQuotedTable(split_table_for_current_piece) + " FORMAT Native "; - - ParserQuery p_query(query.data() + query.size()); - const auto & settings = getContext()->getSettingsRef(); - query_insert_ast = parseQuery(p_query, query, settings.max_query_size, settings.max_parser_depth); - - LOG_INFO(log, "Executing INSERT query: {}", query); - } - - try - { - auto context_select = Context::createCopy(context); - context_select->setSettings(task_cluster->settings_pull); - - auto context_insert = Context::createCopy(context); - context_insert->setSettings(task_cluster->settings_push); - - /// Custom INSERT SELECT implementation - QueryPipeline input; - QueryPipeline output; - { - BlockIO io_insert = InterpreterFactory::instance().get(query_insert_ast, context_insert)->execute(); - - InterpreterSelectWithUnionQuery select(query_select_ast, context_select, SelectQueryOptions{}); - QueryPlan plan; - select.buildQueryPlan(plan); - auto builder = std::move(*plan.buildQueryPipeline( - QueryPlanOptimizationSettings::fromContext(context_select), - BuildQueryPipelineSettings::fromContext(context_select))); - - output = std::move(io_insert.pipeline); - - /// Add converting actions to make it possible to copy blocks with slightly different schema - const auto & select_block = builder.getHeader(); - const auto & insert_block = output.getHeader(); - auto actions_dag = ActionsDAG::makeConvertingActions( - select_block.getColumnsWithTypeAndName(), - insert_block.getColumnsWithTypeAndName(), - ActionsDAG::MatchColumnsMode::Position); - - auto actions = std::make_shared(actions_dag, ExpressionActionsSettings::fromContext(getContext())); - - builder.addSimpleTransform([&](const Block & header) - { - return std::make_shared(header, actions); - }); 
- input = QueryPipelineBuilder::getPipeline(std::move(builder)); - } - - /// Fail-fast optimization to abort copying when the current clean state expires - std::future future_is_dirty_checker; - - Stopwatch watch(CLOCK_MONOTONIC_COARSE); - constexpr UInt64 check_period_milliseconds = 500; - - /// Will asynchronously check that ZooKeeper connection and is_dirty flag appearing while copying data - auto cancel_check = [&] () - { - if (zookeeper->expired()) - throw Exception(ErrorCodes::UNFINISHED, "ZooKeeper session is expired, cancel INSERT SELECT"); - - if (!future_is_dirty_checker.valid()) - future_is_dirty_checker = zookeeper->asyncExists(piece_is_dirty_flag_path); - - /// check_period_milliseconds should less than average insert time of single block - /// Otherwise, the insertion will slow a little bit - if (watch.elapsedMilliseconds() >= check_period_milliseconds) - { - Coordination::ExistsResponse status = future_is_dirty_checker.get(); - - if (status.error != Coordination::Error::ZNONODE) - { - LogicalClock dirt_discovery_epoch (status.stat.mzxid); - if (dirt_discovery_epoch == clean_state_clock.discovery_zxid) - return false; - throw Exception(ErrorCodes::UNFINISHED, "Partition is dirty, cancel INSERT SELECT"); - } - } - - return false; - }; - - /// Update statistics - /// It is quite rough: bytes_copied don't take into account DROP PARTITION. - auto update_stats = [&cluster_partition] (const Block & block) - { - cluster_partition.bytes_copied += block.bytes(); - cluster_partition.rows_copied += block.rows(); - cluster_partition.blocks_copied += 1; - }; - - /// Main work is here - PullingPipelineExecutor pulling_executor(input); - PushingPipelineExecutor pushing_executor(output); - - Block data; - bool is_cancelled = false; - while (pulling_executor.pull(data)) - { - if (cancel_check()) - { - is_cancelled = true; - pushing_executor.cancel(); - pushing_executor.cancel(); - break; - } - pushing_executor.push(data); - update_stats(data); - } - - if (!is_cancelled) - pushing_executor.finish(); - - // Just in case - if (future_is_dirty_checker.valid()) - future_is_dirty_checker.get(); - - if (inject_fault) - throw Exception(ErrorCodes::UNFINISHED, "Copy fault injection is activated"); - } - catch (...) - { - tryLogCurrentException(log, "An error occurred during copying, partition will be marked as dirty"); - create_is_dirty_node(clean_state_clock); - return TaskStatus::Error; - } - } - - LOG_INFO(log, "Partition {} piece {} copied. 
But not moved to original destination table.", task_partition.name, toString(current_piece_number)); - - /// Finalize the processing, change state of current partition task (and also check is_dirty flag) - { - String state_finished = TaskStateWithOwner::getData(TaskState::Finished, host_id); - CleanStateClock new_clean_state_clock (zookeeper, piece_is_dirty_flag_path, piece_is_dirty_cleaned_path); - if (clean_state_clock != new_clean_state_clock) - { - LOG_INFO(log, "Partition {} piece {} clean state changed, cowardly bailing", task_partition.name, toString(current_piece_number)); - return TaskStatus::Error; - } - else if (!new_clean_state_clock.is_clean()) - { - LOG_INFO(log, "Partition {} piece {} became dirty and will be dropped and refilled", task_partition.name, toString(current_piece_number)); - create_is_dirty_node(new_clean_state_clock); - return TaskStatus::Error; - } - zookeeper->set(current_task_piece_status_path, state_finished, 0); - } - - return TaskStatus::Finished; -} - -void ClusterCopier::dropAndCreateLocalTable(const ASTPtr & create_ast) -{ - const auto & create = create_ast->as(); - dropLocalTableIfExists({create.getDatabase(), create.getTable()}); - - auto create_context = Context::createCopy(getContext()); - - InterpreterCreateQuery interpreter(create_ast, create_context); - interpreter.execute(); -} - -void ClusterCopier::dropLocalTableIfExists(const DatabaseAndTableName & table_name) const -{ - auto drop_ast = std::make_shared(); - drop_ast->if_exists = true; - drop_ast->setDatabase(table_name.first); - drop_ast->setTable(table_name.second); - - auto drop_context = Context::createCopy(getContext()); - - InterpreterDropQuery interpreter(drop_ast, drop_context); - interpreter.execute(); -} - -void ClusterCopier::dropHelpingTablesByPieceNumber(const TaskTable & task_table, size_t current_piece_number) -{ - LOG_INFO(log, "Removing helping tables piece {}", current_piece_number); - - DatabaseAndTableName original_table = task_table.table_push; - DatabaseAndTableName helping_table - = DatabaseAndTableName(original_table.first, original_table.second + "_piece_" + toString(current_piece_number)); - - String query = "DROP TABLE IF EXISTS " + getQuotedTable(helping_table); - - const ClusterPtr & cluster_push = task_table.cluster_push; - Settings settings_push = task_cluster->settings_push; - - LOG_INFO(log, "Execute distributed DROP TABLE: {}", query); - - /// We have to drop partition_piece on each replica - UInt64 num_nodes = executeQueryOnCluster(cluster_push, query, settings_push, ClusterExecutionMode::ON_EACH_NODE); - - LOG_INFO(log, "DROP TABLE query was successfully executed on {} nodes.", toString(num_nodes)); -} - -void ClusterCopier::dropHelpingTables(const TaskTable & task_table) -{ - LOG_INFO(log, "Removing helping tables"); - for (size_t current_piece_number = 0; current_piece_number < task_table.number_of_splits; ++current_piece_number) - { - dropHelpingTablesByPieceNumber(task_table, current_piece_number); - } -} - -void ClusterCopier::dropParticularPartitionPieceFromAllHelpingTables(const TaskTable & task_table, const String & partition_name) -{ - LOG_INFO(log, "Try drop partition partition from all helping tables."); - for (size_t current_piece_number = 0; current_piece_number < task_table.number_of_splits; ++current_piece_number) - { - DatabaseAndTableName original_table = task_table.table_push; - DatabaseAndTableName helping_table = DatabaseAndTableName(original_table.first, original_table.second + "_piece_" + toString(current_piece_number)); - - String 
query = "ALTER TABLE " + getQuotedTable(helping_table) + ((partition_name == "'all'") ? " DROP PARTITION ID " : " DROP PARTITION ") + partition_name; - - const ClusterPtr & cluster_push = task_table.cluster_push; - Settings settings_push = task_cluster->settings_push; - - LOG_INFO(log, "Execute distributed DROP PARTITION: {}", query); - /// We have to drop partition_piece on each replica - UInt64 num_nodes = executeQueryOnCluster( - cluster_push, query, - settings_push, - ClusterExecutionMode::ON_EACH_NODE); - - LOG_INFO(log, "DROP PARTITION query was successfully executed on {} nodes.", toString(num_nodes)); - } - LOG_INFO(log, "All helping tables dropped partition {}", partition_name); -} - -String ClusterCopier::getRemoteCreateTable(const DatabaseAndTableName & table, Connection & connection, const Settings & settings) -{ - auto remote_context = Context::createCopy(context); - remote_context->setSettings(settings); - - String query = "SHOW CREATE TABLE " + getQuotedTable(table); - - QueryPipelineBuilder builder; - builder.init(Pipe(std::make_shared( - std::make_shared(connection, query, InterpreterShowCreateQuery::getSampleBlock(), remote_context), false, false, /* async_query_sending= */ false))); - Block block = getBlockWithAllStreamData(std::move(builder)); - return typeid_cast(*block.safeGetByPosition(0).column).getDataAt(0).toString(); -} - - -ASTPtr ClusterCopier::getCreateTableForPullShard(const ConnectionTimeouts & timeouts, TaskShard & task_shard) -{ - /// Fetch and parse (possibly) new definition - auto connection_entry = task_shard.info.pool->get(timeouts, task_cluster->settings_pull, true); - String create_query_pull_str = getRemoteCreateTable( - task_shard.task_table.table_pull, - *connection_entry, - task_cluster->settings_pull); - - ParserCreateQuery parser_create_query; - const auto & settings = getContext()->getSettingsRef(); - return parseQuery(parser_create_query, create_query_pull_str, settings.max_query_size, settings.max_parser_depth); -} - - -/// If it is implicitly asked to create split Distributed table for certain piece on current shard, we will do it. 
-void ClusterCopier::createShardInternalTables(const ConnectionTimeouts & timeouts, - TaskShard & task_shard, bool create_split) -{ - TaskTable & task_table = task_shard.task_table; - - /// We need to update table definitions for each part, it could be changed after ALTER - task_shard.current_pull_table_create_query = getCreateTableForPullShard(timeouts, task_shard); - - /// Create local Distributed tables: - /// a table fetching data from current shard and a table inserting data to the whole destination cluster - String read_shard_prefix = ".read_shard_" + toString(task_shard.indexInCluster()) + "."; - String split_shard_prefix = ".split."; - task_shard.table_read_shard = DatabaseAndTableName(working_database_name, read_shard_prefix + task_table.table_id); - task_shard.main_table_split_shard = DatabaseAndTableName(working_database_name, split_shard_prefix + task_table.table_id); - - for (const auto & piece_number : collections::range(0, task_table.number_of_splits)) - { - task_shard.list_of_split_tables_on_shard[piece_number] = - DatabaseAndTableName(working_database_name, split_shard_prefix + task_table.table_id + "_piece_" + toString(piece_number)); - } - - /// Create special cluster with single shard - String shard_read_cluster_name = read_shard_prefix + task_table.cluster_pull_name; - ClusterPtr cluster_pull_current_shard = task_table.cluster_pull->getClusterWithSingleShard(task_shard.indexInCluster()); - getContext()->setCluster(shard_read_cluster_name, cluster_pull_current_shard); - - auto storage_shard_ast = createASTStorageDistributed(shard_read_cluster_name, task_table.table_pull.first, task_table.table_pull.second); - - auto create_query_ast = removeAliasMaterializedAndTTLColumnsFromCreateQuery( - task_shard.current_pull_table_create_query, - task_table.allow_to_copy_alias_and_materialized_columns); - - auto create_table_pull_ast = rewriteCreateQueryStorage(create_query_ast, task_shard.table_read_shard, storage_shard_ast); - dropAndCreateLocalTable(create_table_pull_ast); - - if (create_split) - { - auto create_table_split_piece_ast = rewriteCreateQueryStorage( - create_query_ast, - task_shard.main_table_split_shard, - task_table.main_engine_split_ast); - - dropAndCreateLocalTable(create_table_split_piece_ast); - - /// Create auxiliary split tables for each piece - for (const auto & piece_number : collections::range(0, task_table.number_of_splits)) - { - const auto & storage_piece_split_ast = task_table.auxiliary_engine_split_asts[piece_number]; - - create_table_split_piece_ast = rewriteCreateQueryStorage( - create_query_ast, - task_shard.list_of_split_tables_on_shard[piece_number], - storage_piece_split_ast); - - dropAndCreateLocalTable(create_table_split_piece_ast); - } - } - -} - - -std::set ClusterCopier::getShardPartitions(const ConnectionTimeouts & timeouts, TaskShard & task_shard) -{ - std::set res; - - createShardInternalTables(timeouts, task_shard, false); - - TaskTable & task_table = task_shard.task_table; - - const String & partition_name = queryToString(task_table.engine_push_partition_key_ast); - - if (partition_name == "'all'") - { - res.emplace("'all'"); - return res; - } - - String query; - { - WriteBufferFromOwnString wb; - wb << "SELECT " << partition_name << " AS partition FROM " - << getQuotedTable(task_shard.table_read_shard) << " GROUP BY partition ORDER BY partition DESC"; - query = wb.str(); - } - - ParserQuery parser_query(query.data() + query.size()); - const auto & settings = getContext()->getSettingsRef(); - ASTPtr query_ast = parseQuery(parser_query, 
query, settings.max_query_size, settings.max_parser_depth); - - LOG_INFO(log, "Computing destination partition set, executing query: {}", query); - - auto local_context = Context::createCopy(context); - local_context->setSettings(task_cluster->settings_pull); - InterpreterSelectWithUnionQuery select(query_ast, local_context, SelectQueryOptions{}); - QueryPlan plan; - select.buildQueryPlan(plan); - auto builder = std::move(*plan.buildQueryPipeline( - QueryPlanOptimizationSettings::fromContext(local_context), - BuildQueryPipelineSettings::fromContext(local_context))); - - Block block = getBlockWithAllStreamData(std::move(builder)); - - if (block) - { - ColumnWithTypeAndName & column = block.getByPosition(0); - task_shard.partition_key_column = column; - - for (size_t i = 0; i < column.column->size(); ++i) - { - WriteBufferFromOwnString wb; - column.type->getDefaultSerialization()->serializeTextQuoted(*column.column, i, wb, FormatSettings()); - res.emplace(wb.str()); - } - } - - LOG_INFO(log, "There are {} destination partitions in shard {}", res.size(), task_shard.getDescription()); - - return res; -} - -bool ClusterCopier::checkShardHasPartition(const ConnectionTimeouts & timeouts, - TaskShard & task_shard, const String & partition_quoted_name) -{ - createShardInternalTables(timeouts, task_shard, false); - - TaskTable & task_table = task_shard.task_table; - - WriteBufferFromOwnString ss; - ss << "WITH " + partition_quoted_name + " AS partition_key "; - ss << "SELECT 1 FROM " << getQuotedTable(task_shard.table_read_shard); - ss << " WHERE (" << queryToString(task_table.engine_push_partition_key_ast) << " = partition_key)"; - if (!task_table.where_condition_str.empty()) - ss << " AND (" << task_table.where_condition_str << ")"; - ss << " LIMIT 1"; - auto query = ss.str(); - - ParserQuery parser_query(query.data() + query.size()); - const auto & settings = getContext()->getSettingsRef(); - ASTPtr query_ast = parseQuery(parser_query, query, settings.max_query_size, settings.max_parser_depth); - - LOG_INFO(log, "Checking shard {} for partition {} existence, executing query: {}", - task_shard.getDescription(), partition_quoted_name, query_ast->formatForErrorMessage()); - - auto local_context = Context::createCopy(context); - local_context->setSettings(task_cluster->settings_pull); - auto pipeline = InterpreterFactory::instance().get(query_ast, local_context)->execute().pipeline; - PullingPipelineExecutor executor(pipeline); - Block block; - executor.pull(block); - return block.rows() != 0; -} - -bool ClusterCopier::checkPresentPartitionPiecesOnCurrentShard(const ConnectionTimeouts & timeouts, - TaskShard & task_shard, const String & partition_quoted_name, size_t current_piece_number) -{ - createShardInternalTables(timeouts, task_shard, false); - - TaskTable & task_table = task_shard.task_table; - const size_t number_of_splits = task_table.number_of_splits; - const String & primary_key_comma_separated = task_table.primary_key_comma_separated; - - UNUSED(primary_key_comma_separated); - - std::string query; - - query += "WITH " + partition_quoted_name + " AS partition_key "; - query += "SELECT 1 FROM " + getQuotedTable(task_shard.table_read_shard); - - if (experimental_use_sample_offset) - query += " SAMPLE 1/" + toString(number_of_splits) + " OFFSET " + toString(current_piece_number) + "/" + toString(number_of_splits); - - query += " WHERE (" + queryToString(task_table.engine_push_partition_key_ast) + " = partition_key)"; - - if (!experimental_use_sample_offset) - query += " AND (cityHash64(" + 
primary_key_comma_separated + ") % " - + std::to_string(number_of_splits) + " = " + std::to_string(current_piece_number) + " )"; - - if (!task_table.where_condition_str.empty()) - query += " AND (" + task_table.where_condition_str + ")"; - - query += " LIMIT 1"; - - LOG_INFO(log, "Checking shard {} for partition {} piece {} existence, executing query: {}", task_shard.getDescription(), partition_quoted_name, std::to_string(current_piece_number), query); - - ParserQuery parser_query(query.data() + query.size()); - const auto & settings = getContext()->getSettingsRef(); - ASTPtr query_ast = parseQuery(parser_query, query, settings.max_query_size, settings.max_parser_depth); - - auto local_context = Context::createCopy(context); - local_context->setSettings(task_cluster->settings_pull); - auto pipeline = InterpreterFactory::instance().get(query_ast, local_context)->execute().pipeline; - PullingPipelineExecutor executor(pipeline); - Block result; - executor.pull(result); - if (result.rows() != 0) - LOG_INFO(log, "Partition {} piece number {} is PRESENT on shard {}", partition_quoted_name, std::to_string(current_piece_number), task_shard.getDescription()); - else - LOG_INFO(log, "Partition {} piece number {} is ABSENT on shard {}", partition_quoted_name, std::to_string(current_piece_number), task_shard.getDescription()); - return result.rows() != 0; -} - - -/** Executes simple query (without output streams, for example DDL queries) on each shard of the cluster - * Returns number of shards for which at least one replica executed query successfully - */ -UInt64 ClusterCopier::executeQueryOnCluster( - const ClusterPtr & cluster, - const String & query, - const Settings & current_settings, - ClusterExecutionMode execution_mode) const -{ - ClusterPtr cluster_for_query = cluster; - if (execution_mode == ClusterExecutionMode::ON_EACH_NODE) - cluster_for_query = cluster->getClusterWithReplicasAsShards(current_settings); - - std::vector> connections; - connections.reserve(cluster->getShardCount()); - - std::atomic successfully_executed = 0; - - for (const auto & replicas : cluster_for_query->getShardsAddresses()) - { - for (const auto & node : replicas) - { - try - { - connections.emplace_back(std::make_shared( - node.host_name, node.port, node.default_database, - node.user, node.password, ssh::SSHKey(), node.quota_key, node.cluster, node.cluster_secret, - "ClusterCopier", node.compression, node.secure - )); - - /// We execute only Alter, Create and Drop queries. - const auto header = Block{}; - - /// For unknown reason global context is passed to IStorage::read() method - /// So, task_identifier is passed as constructor argument. It is more obvious. - auto remote_query_executor = std::make_shared( - *connections.back(), query, header, getContext(), - /*throttler=*/nullptr, Scalars(), Tables(), QueryProcessingStage::Complete); - - try - { - remote_query_executor->sendQuery(); - } - catch (...) - { - LOG_WARNING(log, "Node with address {} seems to be unreachable.", node.host_name); - continue; - } - - while (true) - { - auto block = remote_query_executor->readBlock(); - if (!block) - break; - } - - remote_query_executor->finish(); - ++successfully_executed; - break; - } - catch (...) 
- { - LOG_WARNING(log, "An error occurred while processing query: {}", query); - tryLogCurrentException(log); - continue; - } - } - } - - return successfully_executed.load(); -} - -} diff --git a/programs/copier/ClusterCopier.h b/programs/copier/ClusterCopier.h deleted file mode 100644 index 01f8b30f546..00000000000 --- a/programs/copier/ClusterCopier.h +++ /dev/null @@ -1,240 +0,0 @@ -#pragma once - -#include "Aliases.h" -#include "Internals.h" -#include "TaskCluster.h" -#include "TaskShard.h" -#include "TaskTable.h" -#include "ShardPartition.h" -#include "ShardPartitionPiece.h" -#include "ZooKeeperStaff.h" - - -namespace DB -{ - -class ClusterCopier : WithMutableContext -{ -public: - ClusterCopier(const String & task_path_, - const String & host_id_, - const String & proxy_database_name_, - ContextMutablePtr context_, - LoggerRawPtr log_) - : WithMutableContext(context_), - task_zookeeper_path(task_path_), - host_id(host_id_), - working_database_name(proxy_database_name_), - log(log_) {} - - void init(); - - template - decltype(auto) retry(T && func, UInt64 max_tries = 100); - - void discoverShardPartitions(const ConnectionTimeouts & timeouts, const TaskShardPtr & task_shard); - - /// Compute set of partitions, assume set of partitions aren't changed during the processing - void discoverTablePartitions(const ConnectionTimeouts & timeouts, TaskTable & task_table, UInt64 num_threads = 0); - - void uploadTaskDescription(const std::string & task_path, const std::string & task_file, bool force); - - void reloadTaskDescription(); - - void updateConfigIfNeeded(); - - void process(const ConnectionTimeouts & timeouts); - - /// Disables DROP PARTITION commands that used to clear data after errors - void setSafeMode(bool is_safe_mode_ = true) - { - is_safe_mode = is_safe_mode_; - } - - void setCopyFaultProbability(double copy_fault_probability_) - { - copy_fault_probability = copy_fault_probability_; - } - - void setMoveFaultProbability(double move_fault_probability_) - { - move_fault_probability = move_fault_probability_; - } - - void setExperimentalUseSampleOffset(bool value) - { - experimental_use_sample_offset = value; - } - - void setMaxTableTries(UInt64 tries) - { - max_table_tries = tries; - } - void setMaxShardPartitionTries(UInt64 tries) - { - max_shard_partition_tries = tries; - } - void setMaxShardPartitionPieceTriesForAlter(UInt64 tries) - { - max_shard_partition_piece_tries_for_alter = tries; - } - void setRetryDelayMs(std::chrono::milliseconds ms) - { - retry_delay_ms = ms; - } - -protected: - - String getWorkersPath() const - { - return task_cluster->task_zookeeper_path + "/task_active_workers"; - } - - String getWorkersPathVersion() const - { - return getWorkersPath() + "_version"; - } - - String getCurrentWorkerNodePath() const - { - return getWorkersPath() + "/" + host_id; - } - - zkutil::EphemeralNodeHolder::Ptr createTaskWorkerNodeAndWaitIfNeed( - const zkutil::ZooKeeperPtr & zookeeper, - const String & description, - bool unprioritized); - - /* - * Checks that partition piece or some other entity is clean. - * The only requirement is that you have to pass is_dirty_flag_path and is_dirty_cleaned_path to the function. - * And is_dirty_flag_path is a parent of is_dirty_cleaned_path. 
- * */ - static bool checkPartitionPieceIsClean( - const zkutil::ZooKeeperPtr & zookeeper, - const CleanStateClock & clean_state_clock, - const String & task_status_path); - - bool checkAllPiecesInPartitionAreDone(const TaskTable & task_table, const String & partition_name, const TasksShard & shards_with_partition); - - /** Checks that the whole partition of a table was copied. We should do it carefully due to dirty lock. - * State of some task could change during the processing. - * We have to ensure that all shards have the finished state and there is no dirty flag. - * Moreover, we have to check status twice and check zxid, because state can change during the checking. - */ - - /* The same as function above - * Assume that we don't know on which shards do we have partition certain piece. - * We'll check them all (I mean shards that contain the whole partition) - * And shards that don't have certain piece MUST mark that piece is_done true. - * */ - bool checkPartitionPieceIsDone(const TaskTable & task_table, const String & partition_name, - size_t piece_number, const TasksShard & shards_with_partition); - - - /*Alter successful insertion to helping tables it will move all pieces to destination table*/ - TaskStatus tryMoveAllPiecesToDestinationTable(const TaskTable & task_table, const String & partition_name); - - /// Removes MATERIALIZED and ALIAS columns from create table query - static ASTPtr removeAliasMaterializedAndTTLColumnsFromCreateQuery(const ASTPtr & query_ast, bool allow_to_copy_alias_and_materialized_columns); - - bool tryDropPartitionPiece(ShardPartition & task_partition, size_t current_piece_number, - const zkutil::ZooKeeperPtr & zookeeper, const CleanStateClock & clean_state_clock); - - bool tryProcessTable(const ConnectionTimeouts & timeouts, TaskTable & task_table); - - TaskStatus tryCreateDestinationTable(const ConnectionTimeouts & timeouts, TaskTable & task_table); - /// Job for copying partition from particular shard. - TaskStatus tryProcessPartitionTask(const ConnectionTimeouts & timeouts, - ShardPartition & task_partition, - bool is_unprioritized_task); - - TaskStatus iterateThroughAllPiecesInPartition(const ConnectionTimeouts & timeouts, - ShardPartition & task_partition, - bool is_unprioritized_task); - - TaskStatus processPartitionPieceTaskImpl(const ConnectionTimeouts & timeouts, - ShardPartition & task_partition, - size_t current_piece_number, - bool is_unprioritized_task); - - void dropAndCreateLocalTable(const ASTPtr & create_ast); - - void dropLocalTableIfExists(const DatabaseAndTableName & table_name) const; - - void dropHelpingTables(const TaskTable & task_table); - - void dropHelpingTablesByPieceNumber(const TaskTable & task_table, size_t current_piece_number); - - /// Is used for usage less disk space. - /// After all pieces were successfully moved to original destination - /// table we can get rid of partition pieces (partitions in helping tables). - void dropParticularPartitionPieceFromAllHelpingTables(const TaskTable & task_table, const String & partition_name); - - String getRemoteCreateTable(const DatabaseAndTableName & table, Connection & connection, const Settings & settings); - - ASTPtr getCreateTableForPullShard(const ConnectionTimeouts & timeouts, TaskShard & task_shard); - - /// If it is implicitly asked to create split Distributed table for certain piece on current shard, we will do it. 
- void createShardInternalTables(const ConnectionTimeouts & timeouts, TaskShard & task_shard, bool create_split = true); - - std::set getShardPartitions(const ConnectionTimeouts & timeouts, TaskShard & task_shard); - - bool checkShardHasPartition(const ConnectionTimeouts & timeouts, TaskShard & task_shard, const String & partition_quoted_name); - - bool checkPresentPartitionPiecesOnCurrentShard(const ConnectionTimeouts & timeouts, - TaskShard & task_shard, const String & partition_quoted_name, size_t current_piece_number); - - /* - * This class is used in executeQueryOnCluster function - * You can execute query on each shard (no sense it is executed on each replica of a shard or not) - * or you can execute query on each replica on each shard. - * First mode is useful for INSERTS queries. - * */ - enum ClusterExecutionMode - { - ON_EACH_SHARD, - ON_EACH_NODE - }; - - /** Executes simple query (without output streams, for example DDL queries) on each shard of the cluster - * Returns number of shards for which at least one replica executed query successfully - */ - UInt64 executeQueryOnCluster( - const ClusterPtr & cluster, - const String & query, - const Settings & current_settings, - ClusterExecutionMode execution_mode = ClusterExecutionMode::ON_EACH_SHARD) const; - -private: - String task_zookeeper_path; - String task_description_path; - String host_id; - String working_database_name; - - /// Auto update config stuff - UInt64 task_description_current_version = 1; - std::atomic task_description_version{1}; - Coordination::WatchCallback task_description_watch_callback; - /// ZooKeeper session used to set the callback - zkutil::ZooKeeperPtr task_description_watch_zookeeper; - - ConfigurationPtr task_cluster_initial_config; - ConfigurationPtr task_cluster_current_config; - - std::unique_ptr task_cluster; - - bool is_safe_mode = false; - double copy_fault_probability = 0.0; - double move_fault_probability = 0.0; - - bool experimental_use_sample_offset{false}; - - LoggerRawPtr log; - - UInt64 max_table_tries = 3; - UInt64 max_shard_partition_tries = 3; - UInt64 max_shard_partition_piece_tries_for_alter = 10; - std::chrono::milliseconds retry_delay_ms{1000}; -}; -} diff --git a/programs/copier/ClusterCopierApp.cpp b/programs/copier/ClusterCopierApp.cpp deleted file mode 100644 index fdf07dec61a..00000000000 --- a/programs/copier/ClusterCopierApp.cpp +++ /dev/null @@ -1,252 +0,0 @@ -#include "ClusterCopierApp.h" -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include - -namespace fs = std::filesystem; - -namespace DB -{ - -/// ClusterCopierApp - -void ClusterCopierApp::initialize(Poco::Util::Application & self) -{ - is_help = config().has("help"); - if (is_help) - return; - - config_xml_path = config().getString("config-file"); - task_path = config().getString("task-path"); - log_level = config().getString("log-level", "info"); - is_safe_mode = config().has("safe-mode"); - is_status_mode = config().has("status"); - if (config().has("copy-fault-probability")) - copy_fault_probability = std::max(std::min(config().getDouble("copy-fault-probability"), 1.0), 0.0); - if (config().has("move-fault-probability")) - move_fault_probability = std::max(std::min(config().getDouble("move-fault-probability"), 1.0), 0.0); - base_dir = (config().has("base-dir")) ? 
config().getString("base-dir") : fs::current_path().string(); - - max_table_tries = std::max(config().getUInt("max-table-tries", 3), 1); - max_shard_partition_tries = std::max(config().getUInt("max-shard-partition-tries", 3), 1); - max_shard_partition_piece_tries_for_alter = std::max(config().getUInt("max-shard-partition-piece-tries-for-alter", 10), 1); - retry_delay_ms = std::chrono::milliseconds(std::max(config().getUInt("retry-delay-ms", 1000), 100)); - - if (config().has("experimental-use-sample-offset")) - experimental_use_sample_offset = config().getBool("experimental-use-sample-offset"); - - // process_id is '#_' - time_t timestamp = Poco::Timestamp().epochTime(); - auto curr_pid = Poco::Process::id(); - - process_id = std::to_string(DateLUT::serverTimezoneInstance().toNumYYYYMMDDhhmmss(timestamp)) + "_" + std::to_string(curr_pid); - host_id = escapeForFileName(getFQDNOrHostName()) + '#' + process_id; - process_path = fs::weakly_canonical(fs::path(base_dir) / ("clickhouse-copier_" + process_id)); - fs::create_directories(process_path); - - /// Override variables for BaseDaemon - if (config().has("log-level")) - config().setString("logger.level", config().getString("log-level")); - - if (config().has("base-dir") || !config().has("logger.log")) - config().setString("logger.log", fs::path(process_path) / "log.log"); - - if (config().has("base-dir") || !config().has("logger.errorlog")) - config().setString("logger.errorlog", fs::path(process_path) / "log.err.log"); - - Base::initialize(self); -} - - -void ClusterCopierApp::handleHelp(const std::string &, const std::string &) -{ - uint16_t terminal_width = 0; - if (isatty(STDIN_FILENO)) - terminal_width = getTerminalWidth(); - - Poco::Util::HelpFormatter help_formatter(options()); - if (terminal_width) - help_formatter.setWidth(terminal_width); - help_formatter.setCommand(commandName()); - help_formatter.setHeader("Copies tables from one cluster to another"); - help_formatter.setUsage("--config-file --task-path "); - help_formatter.format(std::cerr); - help_formatter.setFooter("See also: https://clickhouse.com/docs/en/operations/utilities/clickhouse-copier/"); - - stopOptionsProcessing(); -} - - -void ClusterCopierApp::defineOptions(Poco::Util::OptionSet & options) -{ - Base::defineOptions(options); - - options.addOption(Poco::Util::Option("task-path", "", "path to task in ZooKeeper") - .argument("task-path").binding("task-path")); - options.addOption(Poco::Util::Option("task-file", "", "path to task file for uploading in ZooKeeper to task-path") - .argument("task-file").binding("task-file")); - options.addOption(Poco::Util::Option("task-upload-force", "", "Force upload task-file even node already exists. 
Default is false.") - .argument("task-upload-force").binding("task-upload-force")); - options.addOption(Poco::Util::Option("safe-mode", "", "disables ALTER DROP PARTITION in case of errors") - .binding("safe-mode")); - options.addOption(Poco::Util::Option("copy-fault-probability", "", "the copying fails with specified probability (used to test partition state recovering)") - .argument("copy-fault-probability").binding("copy-fault-probability")); - options.addOption(Poco::Util::Option("move-fault-probability", "", "the moving fails with specified probability (used to test partition state recovering)") - .argument("move-fault-probability").binding("move-fault-probability")); - options.addOption(Poco::Util::Option("log-level", "", "sets log level") - .argument("log-level").binding("log-level")); - options.addOption(Poco::Util::Option("base-dir", "", "base directory for copiers, consecutive copier launches will populate /base-dir/launch_id/* directories") - .argument("base-dir").binding("base-dir")); - options.addOption(Poco::Util::Option("experimental-use-sample-offset", "", "Use SAMPLE OFFSET query instead of cityHash64(PRIMARY KEY) % n == k") - .argument("experimental-use-sample-offset").binding("experimental-use-sample-offset")); - options.addOption(Poco::Util::Option("status", "", "Get for status for current execution").binding("status")); - - options.addOption(Poco::Util::Option("max-table-tries", "", "Number of tries for the copy table task") - .argument("max-table-tries").binding("max-table-tries")); - options.addOption(Poco::Util::Option("max-shard-partition-tries", "", "Number of tries for the copy one partition task") - .argument("max-shard-partition-tries").binding("max-shard-partition-tries")); - options.addOption(Poco::Util::Option("max-shard-partition-piece-tries-for-alter", "", "Number of tries for final ALTER ATTACH to destination table") - .argument("max-shard-partition-piece-tries-for-alter").binding("max-shard-partition-piece-tries-for-alter")); - options.addOption(Poco::Util::Option("retry-delay-ms", "", "Delay between task retries") - .argument("retry-delay-ms").binding("retry-delay-ms")); - - using Me = std::decay_t; - options.addOption(Poco::Util::Option("help", "", "produce this help message").binding("help") - .callback(Poco::Util::OptionCallback(this, &Me::handleHelp))); -} - - -void ClusterCopierApp::mainImpl() -{ - /// Status command - { - if (is_status_mode) - { - SharedContextHolder shared_context = Context::createShared(); - auto context = Context::createGlobal(shared_context.get()); - context->makeGlobalContext(); - SCOPE_EXIT_SAFE(context->shutdown()); - - auto zookeeper = context->getZooKeeper(); - auto status_json = zookeeper->get(task_path + "/status"); - - LOG_INFO(&logger(), "{}", status_json); - std::cout << status_json << std::endl; - - context->resetZooKeeper(); - return; - } - } - StatusFile status_file(process_path + "/status", StatusFile::write_full_info); - ThreadStatus thread_status; - - auto * log = &logger(); - LOG_INFO(log, "Starting clickhouse-copier (id {}, host_id {}, path {}, revision {})", process_id, host_id, process_path, ClickHouseRevision::getVersionRevision()); - - SharedContextHolder shared_context = Context::createShared(); - auto context = Context::createGlobal(shared_context.get()); - context->makeGlobalContext(); - SCOPE_EXIT_SAFE(context->shutdown()); - - context->setConfig(loaded_config.configuration); - context->setApplicationType(Context::ApplicationType::LOCAL); - context->setPath(process_path + "/"); - - 
registerInterpreters(); - registerFunctions(); - registerAggregateFunctions(); - registerTableFunctions(); - registerDatabases(); - registerStorages(); - registerDictionaries(); - registerDisks(/* global_skip_access_check= */ true); - registerFormats(); - - static const std::string default_database = "_local"; - DatabaseCatalog::instance().attachDatabase(default_database, std::make_shared(default_database, context)); - context->setCurrentDatabase(default_database); - - /// Disable queries logging, since: - /// - There are bits that is not allowed for global context, like adding factories info (for the query_log) - /// - And anyway it is useless for copier. - context->setSetting("log_queries", false); - - auto local_context = Context::createCopy(context); - - /// Initialize query scope just in case. - CurrentThread::QueryScope query_scope(local_context); - - auto copier = std::make_unique( - task_path, host_id, default_database, local_context, log); - copier->setSafeMode(is_safe_mode); - copier->setCopyFaultProbability(copy_fault_probability); - copier->setMoveFaultProbability(move_fault_probability); - copier->setMaxTableTries(max_table_tries); - copier->setMaxShardPartitionTries(max_shard_partition_tries); - copier->setMaxShardPartitionPieceTriesForAlter(max_shard_partition_piece_tries_for_alter); - copier->setRetryDelayMs(retry_delay_ms); - copier->setExperimentalUseSampleOffset(experimental_use_sample_offset); - - auto task_file = config().getString("task-file", ""); - if (!task_file.empty()) - copier->uploadTaskDescription(task_path, task_file, config().getBool("task-upload-force", false)); - - zkutil::validateZooKeeperConfig(config()); - - copier->init(); - copier->process(ConnectionTimeouts::getTCPTimeoutsWithoutFailover(context->getSettingsRef())); - - /// Reset ZooKeeper before removing ClusterCopier. - /// Otherwise zookeeper watch can call callback which use already removed ClusterCopier object. - context->resetZooKeeper(); -} - - -int ClusterCopierApp::main(const std::vector &) -{ - if (is_help) - return 0; - - try - { - mainImpl(); - } - catch (...) - { - tryLogCurrentException(&Poco::Logger::root(), __PRETTY_FUNCTION__); - auto code = getCurrentExceptionCode(); - - return (code) ? code : -1; - } - - return 0; -} - - -} - -#pragma GCC diagnostic ignored "-Wunused-function" -#pragma GCC diagnostic ignored "-Wmissing-declarations" - -int mainEntryClickHouseClusterCopier(int argc, char ** argv) -{ - try - { - DB::ClusterCopierApp app; - return app.run(argc, argv); - } - catch (...) - { - std::cerr << DB::getCurrentExceptionMessage(true) << "\n"; - auto code = DB::getCurrentExceptionCode(); - - return (code) ? code : -1; - } -} diff --git a/programs/copier/ClusterCopierApp.h b/programs/copier/ClusterCopierApp.h deleted file mode 100644 index 0ddc232381e..00000000000 --- a/programs/copier/ClusterCopierApp.h +++ /dev/null @@ -1,99 +0,0 @@ -#pragma once - -#include -#include - -#include "ClusterCopier.h" - -/* clickhouse cluster copier util - * Copies tables data from one cluster to new tables of other (possibly the same) cluster in distributed fault-tolerant manner. - * - * See overview in the docs: docs/en/utils/clickhouse-copier.md - * - * Implementation details: - * - * cluster-copier workers pull each partition of each shard of the source cluster and push it to the destination cluster through - * Distributed table (to perform data resharding). So, worker job is a partition of a source shard. - * A job has three states: Active, Finished and Abandoned. 
Abandoned means that worker died and did not finish the job. - * - * If an error occurred during the copying (a worker failed or a worker did not finish the INSERT), then the whole partition (on - * all destination servers) should be dropped and refilled. So, copying entity is a partition of all destination shards. - * If a failure is detected a special /is_dirty node is created in ZooKeeper signalling that other workers copying the same partition - * should stop, after a refilling procedure should start. - * - * ZooKeeper task node has the following structure: - * /task/path_root - path passed in --task-path parameter - * /description - contains user-defined XML config of the task - * /task_active_workers - contains ephemeral nodes of all currently active workers, used to implement max_workers limitation - * /server_fqdn#PID_timestamp - cluster-copier worker ID - * ... - * /tables - directory with table tasks - * /cluster.db.table1 - directory of table_hits task - * /partition1 - directory for partition1 - * /shards - directory for source cluster shards - * /1 - worker job for the first shard of partition1 of table test.hits - * Contains info about current status (Active or Finished) and worker ID. - * /2 - * ... - * /partition_active_workers - * /1 - for each job in /shards a corresponding ephemeral node created in /partition_active_workers - * It is used to detect Abandoned jobs (if there is Active node in /shards and there is no node in - * /partition_active_workers). - * Also, it is used to track active workers in the partition (when we need to refill the partition we do - * not DROP PARTITION while there are active workers) - * /2 - * ... - * /is_dirty - the node is set if some worker detected that an error occurred (the INSERT is failed or an Abandoned node is - * detected). If the node appeared workers in this partition should stop and start cleaning and refilling - * partition procedure. - * During this procedure a single 'cleaner' worker is selected. The worker waits for stopping all partition - * workers, removes /shards node, executes DROP PARTITION on each destination node and removes /is_dirty node. - * /cleaner- An ephemeral node used to select 'cleaner' worker. Contains ID of the worker. - * /cluster.db.table2 - * ... 
- */ - -namespace DB -{ - -class ClusterCopierApp : public BaseDaemon -{ -public: - - void initialize(Poco::Util::Application & self) override; - - void handleHelp(const std::string &, const std::string &); - - void defineOptions(Poco::Util::OptionSet & options) override; - - int main(const std::vector &) override; - -private: - - using Base = BaseDaemon; - - void mainImpl(); - - std::string config_xml_path; - std::string task_path; - std::string log_level = "info"; - bool is_safe_mode = false; - bool is_status_mode = false; - double copy_fault_probability = 0.0; - double move_fault_probability = 0.0; - bool is_help = false; - - UInt64 max_table_tries = 3; - UInt64 max_shard_partition_tries = 3; - UInt64 max_shard_partition_piece_tries_for_alter = 10; - std::chrono::milliseconds retry_delay_ms{1000}; - - bool experimental_use_sample_offset{false}; - - std::string base_dir; - std::string process_path; - std::string process_id; - std::string host_id; -}; - -} diff --git a/programs/copier/ClusterPartition.h b/programs/copier/ClusterPartition.h deleted file mode 100644 index 22063989e22..00000000000 --- a/programs/copier/ClusterPartition.h +++ /dev/null @@ -1,22 +0,0 @@ -#pragma once - -#include -#include - -namespace DB -{ - -/// Contains info about all shards that contain a partition -struct ClusterPartition -{ - double elapsed_time_seconds = 0; - UInt64 bytes_copied = 0; - UInt64 rows_copied = 0; - UInt64 blocks_copied = 0; - - UInt64 total_tries = 0; -}; - -using ClusterPartitions = std::map>; - -} diff --git a/programs/copier/Internals.cpp b/programs/copier/Internals.cpp deleted file mode 100644 index dcd199c6b38..00000000000 --- a/programs/copier/Internals.cpp +++ /dev/null @@ -1,280 +0,0 @@ -#include "Internals.h" -#include -#include -#include -#include -#include -#include -#include - -namespace DB -{ -namespace ErrorCodes -{ - extern const int BAD_ARGUMENTS; -} - -using ConfigurationPtr = Poco::AutoPtr; - -ConfigurationPtr getConfigurationFromXMLString(const std::string & xml_data) -{ - std::stringstream ss(xml_data); // STYLE_CHECK_ALLOW_STD_STRING_STREAM - Poco::XML::InputSource input_source{ss}; - return {new Poco::Util::XMLConfiguration{&input_source}}; -} - -String getQuotedTable(const String & database, const String & table) -{ - if (database.empty()) - return backQuoteIfNeed(table); - - return backQuoteIfNeed(database) + "." 
+ backQuoteIfNeed(table); -} - -String getQuotedTable(const DatabaseAndTableName & db_and_table) -{ - return getQuotedTable(db_and_table.first, db_and_table.second); -} - - -// Creates AST representing 'ENGINE = Distributed(cluster, db, table, [sharding_key]) -std::shared_ptr createASTStorageDistributed( - const String & cluster_name, const String & database, const String & table, - const ASTPtr & sharding_key_ast) -{ - auto args = std::make_shared(); - args->children.emplace_back(std::make_shared(cluster_name)); - args->children.emplace_back(std::make_shared(database)); - args->children.emplace_back(std::make_shared(table)); - if (sharding_key_ast) - args->children.emplace_back(sharding_key_ast); - - auto engine = std::make_shared(); - engine->name = "Distributed"; - engine->arguments = args; - - auto storage = std::make_shared(); - storage->set(storage->engine, engine); - - return storage; -} - - -Block getBlockWithAllStreamData(QueryPipelineBuilder builder) -{ - builder.addTransform(std::make_shared( - builder.getHeader(), - std::numeric_limits::max(), - std::numeric_limits::max())); - - auto cur_pipeline = QueryPipelineBuilder::getPipeline(std::move(builder)); - Block block; - PullingPipelineExecutor executor(cur_pipeline); - executor.pull(block); - - return block; -} - -bool isExtendedDefinitionStorage(const ASTPtr & storage_ast) -{ - const auto & storage = storage_ast->as(); - return storage.partition_by || storage.order_by || storage.sample_by; -} - -ASTPtr extractPartitionKey(const ASTPtr & storage_ast) -{ - String storage_str = queryToString(storage_ast); - - const auto & storage = storage_ast->as(); - const auto & engine = storage.engine->as(); - - if (!endsWith(engine.name, "MergeTree")) - { - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Unsupported engine was specified in {}, only *MergeTree engines are supported", storage_str); - } - - if (isExtendedDefinitionStorage(storage_ast)) - { - if (storage.partition_by) - return storage.partition_by->clone(); - - static const char * all = "all"; - return std::make_shared(Field(all, strlen(all))); - } - else - { - bool is_replicated = startsWith(engine.name, "Replicated"); - size_t min_args = is_replicated ? 3 : 1; - - if (!engine.arguments) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Expected arguments in {}", storage_str); - - ASTPtr arguments_ast = engine.arguments->clone(); - ASTs & arguments = arguments_ast->children; - - if (arguments.size() < min_args) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Expected at least {} arguments in {}", min_args, storage_str); - - ASTPtr & month_arg = is_replicated ? 
arguments[2] : arguments[1]; - return makeASTFunction("toYYYYMM", month_arg->clone()); - } -} - -ASTPtr extractPrimaryKey(const ASTPtr & storage_ast) -{ - String storage_str = queryToString(storage_ast); - - const auto & storage = storage_ast->as(); - const auto & engine = storage.engine->as(); - - if (!endsWith(engine.name, "MergeTree")) - { - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Unsupported engine was specified in {}, only *MergeTree engines are supported", storage_str); - } - - if (!isExtendedDefinitionStorage(storage_ast)) - { - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Is not extended deginition storage {} Will be fixed later.", storage_str); - } - - if (storage.primary_key) - return storage.primary_key->clone(); - - return nullptr; -} - - -ASTPtr extractOrderBy(const ASTPtr & storage_ast) -{ - String storage_str = queryToString(storage_ast); - - const auto & storage = storage_ast->as(); - const auto & engine = storage.engine->as(); - - if (!endsWith(engine.name, "MergeTree")) - { - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Unsupported engine was specified in {}, only *MergeTree engines are supported", storage_str); - } - - if (!isExtendedDefinitionStorage(storage_ast)) - { - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Is not extended deginition storage {} Will be fixed later.", storage_str); - } - - if (storage.order_by) - return storage.order_by->clone(); - - throw Exception(ErrorCodes::BAD_ARGUMENTS, "ORDER BY cannot be empty"); -} - -/// Wraps only identifiers with backticks. -std::string wrapIdentifiersWithBackticks(const ASTPtr & root) -{ - if (auto identifier = std::dynamic_pointer_cast(root)) - return backQuote(identifier->name()); - - if (auto function = std::dynamic_pointer_cast(root)) - return function->name + '(' + wrapIdentifiersWithBackticks(function->arguments) + ')'; - - if (auto expression_list = std::dynamic_pointer_cast(root)) - { - Names function_arguments(expression_list->children.size()); - for (size_t i = 0; i < expression_list->children.size(); ++i) - function_arguments[i] = wrapIdentifiersWithBackticks(expression_list->children[0]); - return boost::algorithm::join(function_arguments, ", "); - } - - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Primary key could be represented only as columns or functions from columns."); -} - - -Names extractPrimaryKeyColumnNames(const ASTPtr & storage_ast) -{ - const auto sorting_key_ast = extractOrderBy(storage_ast); - const auto primary_key_ast = extractPrimaryKey(storage_ast); - - const auto sorting_key_expr_list = extractKeyExpressionList(sorting_key_ast); - const auto primary_key_expr_list = primary_key_ast - ? extractKeyExpressionList(primary_key_ast) : sorting_key_expr_list->clone(); - - /// Maybe we have to handle VersionedCollapsing engine separately. But in our case in looks pointless. - - size_t primary_key_size = primary_key_expr_list->children.size(); - size_t sorting_key_size = sorting_key_expr_list->children.size(); - - if (primary_key_size > sorting_key_size) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Primary key must be a prefix of the sorting key, but its length: " - "{} is greater than the sorting key length: {}", - primary_key_size, sorting_key_size); - - Names primary_key_columns; - NameSet primary_key_columns_set; - - for (size_t i = 0; i < sorting_key_size; ++i) - { - /// Column name could be represented as a f_1(f_2(...f_n(column_name))). - /// Each f_i could take one or more parameters. - /// We will wrap identifiers with backticks to allow non-standard identifier names. 
- String sorting_key_column = sorting_key_expr_list->children[i]->getColumnName(); - - if (i < primary_key_size) - { - String pk_column = primary_key_expr_list->children[i]->getColumnName(); - if (pk_column != sorting_key_column) - throw Exception(ErrorCodes::BAD_ARGUMENTS, - "Primary key must be a prefix of the sorting key, " - "but the column in the position {} is {}, not {}", i, sorting_key_column, pk_column); - - if (!primary_key_columns_set.emplace(pk_column).second) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Primary key contains duplicate columns"); - - primary_key_columns.push_back(wrapIdentifiersWithBackticks(primary_key_expr_list->children[i])); - } - } - - return primary_key_columns; -} - -bool isReplicatedTableEngine(const ASTPtr & storage_ast) -{ - const auto & storage = storage_ast->as(); - const auto & engine = storage.engine->as(); - - if (!endsWith(engine.name, "MergeTree")) - { - String storage_str = queryToString(storage_ast); - throw Exception(ErrorCodes::BAD_ARGUMENTS, "Unsupported engine was specified in {}, only *MergeTree engines are supported", storage_str); - } - - return startsWith(engine.name, "Replicated"); -} - -ShardPriority getReplicasPriority(const Cluster::Addresses & replicas, const std::string & local_hostname, UInt8 random) -{ - ShardPriority res; - - if (replicas.empty()) - return res; - - res.is_remote = 1; - for (const auto & replica : replicas) - { - if (isLocalAddress(DNSResolver::instance().resolveHostAllInOriginOrder(replica.host_name).front())) - { - res.is_remote = 0; - break; - } - } - - res.hostname_difference = std::numeric_limits::max(); - for (const auto & replica : replicas) - { - size_t difference = getHostNamePrefixDistance(local_hostname, replica.host_name); - res.hostname_difference = std::min(difference, res.hostname_difference); - } - - res.random = random; - return res; -} - -} diff --git a/programs/copier/Internals.h b/programs/copier/Internals.h deleted file mode 100644 index 27fedd5d9e8..00000000000 --- a/programs/copier/Internals.h +++ /dev/null @@ -1,198 +0,0 @@ -#pragma once - -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include - -#include "Aliases.h" - -namespace DB -{ - -namespace ErrorCodes -{ - extern const int LOGICAL_ERROR; -} - - -ConfigurationPtr getConfigurationFromXMLString(const std::string & xml_data); - -String getQuotedTable(const String & database, const String & table); - -String getQuotedTable(const DatabaseAndTableName & db_and_table); - - -enum class TaskState -{ - Started = 0, - Finished, - Unknown -}; - -/// Used to mark status of shard partition tasks -struct TaskStateWithOwner -{ - TaskStateWithOwner() = default; - - TaskStateWithOwner(TaskState state_, const String & owner_) : state(state_), owner(owner_) {} - - TaskState state{TaskState::Unknown}; - String owner; - - static String getData(TaskState state, const String &owner) - { - return TaskStateWithOwner(state, owner).toString(); - } - - String toString() const - { - WriteBufferFromOwnString wb; - 
wb << static_cast(state) << "\n" << escape << owner; - return wb.str(); - } - - static TaskStateWithOwner fromString(const String & data) - { - ReadBufferFromString rb(data); - TaskStateWithOwner res; - UInt32 state; - - rb >> state >> "\n" >> escape >> res.owner; - - if (state >= static_cast(TaskState::Unknown)) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Unknown state {}", data); - - res.state = static_cast(state); - return res; - } -}; - - -struct ShardPriority -{ - UInt8 is_remote = 1; - size_t hostname_difference = 0; - UInt8 random = 0; - - static bool greaterPriority(const ShardPriority & current, const ShardPriority & other) - { - return std::forward_as_tuple(current.is_remote, current.hostname_difference, current.random) - < std::forward_as_tuple(other.is_remote, other.hostname_difference, other.random); - } -}; - -/// Execution status of a task. -/// Is used for: partition copying task status, partition piece copying task status, partition moving task status. -enum class TaskStatus -{ - Active, - Finished, - Error, -}; - -struct MultiTransactionInfo -{ - int32_t code; - Coordination::Requests requests; - Coordination::Responses responses; -}; - -// Creates AST representing 'ENGINE = Distributed(cluster, db, table, [sharding_key]) -std::shared_ptr createASTStorageDistributed( - const String & cluster_name, const String & database, const String & table, - const ASTPtr & sharding_key_ast = nullptr); - -Block getBlockWithAllStreamData(QueryPipelineBuilder builder); - -bool isExtendedDefinitionStorage(const ASTPtr & storage_ast); - -ASTPtr extractPartitionKey(const ASTPtr & storage_ast); - -/* -* Choosing a Primary Key that Differs from the Sorting Key -* It is possible to specify a primary key (an expression with values that are written in the index file for each mark) -* that is different from the sorting key (an expression for sorting the rows in data parts). -* In this case the primary key expression tuple must be a prefix of the sorting key expression tuple. -* This feature is helpful when using the SummingMergeTree and AggregatingMergeTree table engines. -* In a common case when using these engines, the table has two types of columns: dimensions and measures. -* Typical queries aggregate values of measure columns with arbitrary GROUP BY and filtering by dimensions. -* Because SummingMergeTree and AggregatingMergeTree aggregate rows with the same value of the sorting key, -* it is natural to add all dimensions to it. As a result, the key expression consists of a long list of columns -* and this list must be frequently updated with newly added dimensions. -* In this case it makes sense to leave only a few columns in the primary key that will provide efficient -* range scans and add the remaining dimension columns to the sorting key tuple. -* ALTER of the sorting key is a lightweight operation because when a new column is simultaneously added t -* o the table and to the sorting key, existing data parts don't need to be changed. -* Since the old sorting key is a prefix of the new sorting key and there is no data in the newly added column, -* the data is sorted by both the old and new sorting keys at the moment of table modification. 
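The comment above states the invariant that extractPrimaryKeyColumnNames() (shown earlier in this patch) enforces: the primary key expression tuple must be a prefix of the sorting key expression tuple. A minimal standalone C++ sketch of just that prefix rule, with made-up column names and plain string vectors standing in for AST nodes:

#include <cassert>
#include <string>
#include <vector>

/// Returns true if primary_key is a (possibly shorter) prefix of sorting_key.
static bool isPrefixOfSortingKey(const std::vector<std::string> & primary_key,
                                 const std::vector<std::string> & sorting_key)
{
    if (primary_key.size() > sorting_key.size())
        return false;
    for (size_t i = 0; i < primary_key.size(); ++i)
        if (primary_key[i] != sorting_key[i])
            return false;
    return true;
}

int main()
{
    /// e.g. ORDER BY (CounterID, EventDate, intHash32(UserID)), PRIMARY KEY (CounterID, EventDate)
    std::vector<std::string> sorting_key{"CounterID", "EventDate", "intHash32(UserID)"};
    std::vector<std::string> primary_key{"CounterID", "EventDate"};
    assert(isPrefixOfSortingKey(primary_key, sorting_key));

    /// A key that diverges from the sorting key (or is longer than it) must be rejected.
    assert(!isPrefixOfSortingKey({"EventDate"}, sorting_key));
    return 0;
}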
-* -* */ -ASTPtr extractPrimaryKey(const ASTPtr & storage_ast); - -ASTPtr extractOrderBy(const ASTPtr & storage_ast); - -Names extractPrimaryKeyColumnNames(const ASTPtr & storage_ast); - -bool isReplicatedTableEngine(const ASTPtr & storage_ast); - -ShardPriority getReplicasPriority(const Cluster::Addresses & replicas, const std::string & local_hostname, UInt8 random); - -} diff --git a/programs/copier/ShardPartition.cpp b/programs/copier/ShardPartition.cpp deleted file mode 100644 index 4c962fc807d..00000000000 --- a/programs/copier/ShardPartition.cpp +++ /dev/null @@ -1,70 +0,0 @@ -#include "ShardPartition.h" - -#include "TaskShard.h" -#include "TaskTable.h" - -namespace DB -{ - -ShardPartition::ShardPartition(TaskShard & parent, String name_quoted_, size_t number_of_splits) - : task_shard(parent) - , name(std::move(name_quoted_)) -{ - pieces.reserve(number_of_splits); -} - -String ShardPartition::getPartitionCleanStartPath() const -{ - return getPartitionPath() + "/clean_start"; -} - -String ShardPartition::getPartitionPieceCleanStartPath(size_t current_piece_number) const -{ - assert(current_piece_number < task_shard.task_table.number_of_splits); - return getPartitionPiecePath(current_piece_number) + "/clean_start"; -} - -String ShardPartition::getPartitionPath() const -{ - return task_shard.task_table.getPartitionPath(name); -} - -String ShardPartition::getPartitionPiecePath(size_t current_piece_number) const -{ - assert(current_piece_number < task_shard.task_table.number_of_splits); - return task_shard.task_table.getPartitionPiecePath(name, current_piece_number); -} - -String ShardPartition::getShardStatusPath() const -{ - // schema: //tables///shards/ - // e.g. /root/table_test.hits/201701/shards/1 - return getPartitionShardsPath() + "/" + toString(task_shard.numberInCluster()); -} - -String ShardPartition::getPartitionShardsPath() const -{ - return getPartitionPath() + "/shards"; -} - -String ShardPartition::getPartitionActiveWorkersPath() const -{ - return getPartitionPath() + "/partition_active_workers"; -} - -String ShardPartition::getActiveWorkerPath() const -{ - return getPartitionActiveWorkersPath() + "/" + toString(task_shard.numberInCluster()); -} - -String ShardPartition::getCommonPartitionIsDirtyPath() const -{ - return getPartitionPath() + "/is_dirty"; -} - -String ShardPartition::getCommonPartitionIsCleanedPath() const -{ - return getCommonPartitionIsDirtyPath() + "/cleaned"; -} - -} diff --git a/programs/copier/ShardPartition.h b/programs/copier/ShardPartition.h deleted file mode 100644 index 2457213733c..00000000000 --- a/programs/copier/ShardPartition.h +++ /dev/null @@ -1,54 +0,0 @@ -#pragma once - -#include "ShardPartitionPiece.h" - -#include - -#include - -namespace DB -{ - -struct TaskShard; - -/// Just destination partition of a shard -/// I don't know what this comment means. -/// In short, when we discovered what shards contain currently processing partition, -/// This class describes a partition (name) that is stored on the shard (parent). 
-struct ShardPartition -{ - ShardPartition(TaskShard &parent, String name_quoted_, size_t number_of_splits = 10); - - String getPartitionPath() const; - - String getPartitionPiecePath(size_t current_piece_number) const; - - String getPartitionCleanStartPath() const; - - String getPartitionPieceCleanStartPath(size_t current_piece_number) const; - - String getCommonPartitionIsDirtyPath() const; - - String getCommonPartitionIsCleanedPath() const; - - String getPartitionActiveWorkersPath() const; - - String getActiveWorkerPath() const; - - String getPartitionShardsPath() const; - - String getShardStatusPath() const; - - /// What partition pieces are present in current shard. - /// FYI: Piece is a part of partition which has modulo equals to concrete constant (less than number_of_splits obliously) - /// For example SELECT ... from ... WHERE partition=current_partition AND cityHash64(*) == const; - /// Absent pieces have field is_absent_piece equals to true. - PartitionPieces pieces; - - TaskShard & task_shard; - String name; -}; - -using TasksPartition = std::map>; - -} diff --git a/programs/copier/ShardPartitionPiece.cpp b/programs/copier/ShardPartitionPiece.cpp deleted file mode 100644 index 36d1621e012..00000000000 --- a/programs/copier/ShardPartitionPiece.cpp +++ /dev/null @@ -1,64 +0,0 @@ -#include "ShardPartitionPiece.h" - -#include "ShardPartition.h" -#include "TaskShard.h" - -#include - -namespace DB -{ - -ShardPartitionPiece::ShardPartitionPiece(ShardPartition & parent, size_t current_piece_number_, bool is_present_piece_) - : is_absent_piece(!is_present_piece_) - , current_piece_number(current_piece_number_) - , shard_partition(parent) -{ -} - -String ShardPartitionPiece::getPartitionPiecePath() const -{ - return shard_partition.getPartitionPath() + "/piece_" + toString(current_piece_number); -} - -String ShardPartitionPiece::getPartitionPieceCleanStartPath() const -{ - return getPartitionPiecePath() + "/clean_start"; -} - -String ShardPartitionPiece::getPartitionPieceIsDirtyPath() const -{ - return getPartitionPiecePath() + "/is_dirty"; -} - -String ShardPartitionPiece::getPartitionPieceIsCleanedPath() const -{ - return getPartitionPieceIsDirtyPath() + "/cleaned"; -} - -String ShardPartitionPiece::getPartitionPieceActiveWorkersPath() const -{ - return getPartitionPiecePath() + "/partition_piece_active_workers"; -} - -String ShardPartitionPiece::getActiveWorkerPath() const -{ - return getPartitionPieceActiveWorkersPath() + "/" + toString(shard_partition.task_shard.numberInCluster()); -} - -/// On what shards do we have current partition. 
-String ShardPartitionPiece::getPartitionPieceShardsPath() const -{ - return getPartitionPiecePath() + "/shards"; -} - -String ShardPartitionPiece::getShardStatusPath() const -{ - return getPartitionPieceShardsPath() + "/" + toString(shard_partition.task_shard.numberInCluster()); -} - -String ShardPartitionPiece::getPartitionPieceCleanerPath() const -{ - return getPartitionPieceIsDirtyPath() + "/cleaner"; -} - -} diff --git a/programs/copier/ShardPartitionPiece.h b/programs/copier/ShardPartitionPiece.h deleted file mode 100644 index 453364c0fc8..00000000000 --- a/programs/copier/ShardPartitionPiece.h +++ /dev/null @@ -1,43 +0,0 @@ -#pragma once - -#include - -#include - -namespace DB -{ - -struct ShardPartition; - -struct ShardPartitionPiece -{ - ShardPartitionPiece(ShardPartition & parent, size_t current_piece_number_, bool is_present_piece_); - - String getPartitionPiecePath() const; - - String getPartitionPieceCleanStartPath() const; - - String getPartitionPieceIsDirtyPath() const; - - String getPartitionPieceIsCleanedPath() const; - - String getPartitionPieceActiveWorkersPath() const; - - String getActiveWorkerPath() const ; - - /// On what shards do we have current partition. - String getPartitionPieceShardsPath() const; - - String getShardStatusPath() const; - - String getPartitionPieceCleanerPath() const; - - bool is_absent_piece; - const size_t current_piece_number; - - ShardPartition & shard_partition; -}; - -using PartitionPieces = std::vector; - -} diff --git a/programs/copier/StatusAccumulator.cpp b/programs/copier/StatusAccumulator.cpp deleted file mode 100644 index 77adeac708c..00000000000 --- a/programs/copier/StatusAccumulator.cpp +++ /dev/null @@ -1,48 +0,0 @@ -#include "StatusAccumulator.h" - -#include -#include -#include -#include - -#include - -namespace DB -{ - -StatusAccumulator::MapPtr StatusAccumulator::fromJSON(String state_json) -{ - Poco::JSON::Parser parser; - auto state = parser.parse(state_json).extract(); - MapPtr result_ptr = std::make_shared(); - for (const auto & table_name : state->getNames()) - { - auto table_status_json = state->getValue(table_name); - auto table_status = parser.parse(table_status_json).extract(); - /// Map entry will be created if it is absent - auto & map_table_status = (*result_ptr)[table_name]; - map_table_status.all_partitions_count += table_status->getValue("all_partitions_count"); - map_table_status.processed_partitions_count += table_status->getValue("processed_partitions_count"); - } - return result_ptr; -} - -String StatusAccumulator::serializeToJSON(MapPtr statuses) -{ - Poco::JSON::Object result_json; - for (const auto & [table_name, table_status] : *statuses) - { - Poco::JSON::Object status_json; - status_json.set("all_partitions_count", table_status.all_partitions_count); - status_json.set("processed_partitions_count", table_status.processed_partitions_count); - - result_json.set(table_name, status_json); - } - std::ostringstream oss; // STYLE_CHECK_ALLOW_STD_STRING_STREAM - oss.exceptions(std::ios::failbit); - Poco::JSON::Stringifier::stringify(result_json, oss); - auto result = oss.str(); - return result; -} - -} diff --git a/programs/copier/StatusAccumulator.h b/programs/copier/StatusAccumulator.h deleted file mode 100644 index d420b611602..00000000000 --- a/programs/copier/StatusAccumulator.h +++ /dev/null @@ -1,27 +0,0 @@ -#pragma once - -#include - -#include -#include - -namespace DB -{ - -class StatusAccumulator -{ -public: - struct TableStatus - { - size_t all_partitions_count; - size_t processed_partitions_count; 
- }; - - using Map = std::unordered_map; - using MapPtr = std::shared_ptr; - - static MapPtr fromJSON(String state_json); - static String serializeToJSON(MapPtr statuses); -}; - -} diff --git a/programs/copier/TaskCluster.cpp b/programs/copier/TaskCluster.cpp deleted file mode 100644 index 0fb06616e50..00000000000 --- a/programs/copier/TaskCluster.cpp +++ /dev/null @@ -1,74 +0,0 @@ -#include "TaskCluster.h" - -namespace DB -{ - -namespace ErrorCodes -{ - extern const int BAD_ARGUMENTS; -} - -TaskCluster::TaskCluster(const String & task_zookeeper_path_, const String & default_local_database_) - : task_zookeeper_path(task_zookeeper_path_) - , default_local_database(default_local_database_) -{} - -void DB::TaskCluster::loadTasks(const Poco::Util::AbstractConfiguration & config, const String & base_key) -{ - String prefix = base_key.empty() ? "" : base_key + "."; - - clusters_prefix = prefix + "remote_servers"; - if (!config.has(clusters_prefix)) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "You should specify list of clusters in {}", clusters_prefix); - - Poco::Util::AbstractConfiguration::Keys tables_keys; - config.keys(prefix + "tables", tables_keys); - - for (const auto & table_key : tables_keys) - { - table_tasks.emplace_back(*this, config, prefix + "tables", table_key); - } -} - -void DB::TaskCluster::reloadSettings(const Poco::Util::AbstractConfiguration & config, const String & base_key) -{ - String prefix = base_key.empty() ? "" : base_key + "."; - - max_workers = config.getUInt64(prefix + "max_workers"); - - settings_common = Settings(); - if (config.has(prefix + "settings")) - settings_common.loadSettingsFromConfig(prefix + "settings", config); - - settings_common.prefer_localhost_replica = false; - - settings_pull = settings_common; - if (config.has(prefix + "settings_pull")) - settings_pull.loadSettingsFromConfig(prefix + "settings_pull", config); - - settings_push = settings_common; - if (config.has(prefix + "settings_push")) - settings_push.loadSettingsFromConfig(prefix + "settings_push", config); - - auto set_default_value = [] (auto && setting, auto && default_value) - { - setting = setting.changed ? setting.value : default_value; - }; - - /// Override important settings - settings_pull.readonly = 1; - settings_pull.prefer_localhost_replica = false; - settings_push.distributed_foreground_insert = true; - settings_push.prefer_localhost_replica = false; - - set_default_value(settings_pull.load_balancing, LoadBalancing::NEAREST_HOSTNAME); - set_default_value(settings_pull.max_threads, 1); - set_default_value(settings_pull.max_block_size, 8192UL); - set_default_value(settings_pull.preferred_block_size_bytes, 0); - - set_default_value(settings_push.distributed_background_insert_timeout, 0); - set_default_value(settings_push.alter_sync, 2); -} - -} - diff --git a/programs/copier/TaskCluster.h b/programs/copier/TaskCluster.h deleted file mode 100644 index a7f8bc3baca..00000000000 --- a/programs/copier/TaskCluster.h +++ /dev/null @@ -1,51 +0,0 @@ -#pragma once - -#include "TaskTable.h" - -#include -#include - -#include - -#include - -namespace DB -{ - -struct TaskCluster -{ - TaskCluster(const String & task_zookeeper_path_, const String & default_local_database_); - - void loadTasks(const Poco::Util::AbstractConfiguration & config, const String & base_key = ""); - - /// Set (or update) settings and max_workers param - void reloadSettings(const Poco::Util::AbstractConfiguration & config, const String & base_key = ""); - - /// Base node for all tasks. 
Its structure: - /// workers/ - directory with active workers (amount of them is less or equal max_workers) - /// description - node with task configuration - /// table_table1/ - directories with per-partition copying status - String task_zookeeper_path; - - /// Database used to create temporary Distributed tables - String default_local_database; - - /// Limits number of simultaneous workers - UInt64 max_workers = 0; - - /// Base settings for pull and push - Settings settings_common; - /// Settings used to fetch data - Settings settings_pull; - /// Settings used to insert data - Settings settings_push; - - String clusters_prefix; - - /// Subtasks - TasksTable table_tasks; - - pcg64 random_engine; -}; - -} diff --git a/programs/copier/TaskShard.cpp b/programs/copier/TaskShard.cpp deleted file mode 100644 index d156f451a84..00000000000 --- a/programs/copier/TaskShard.cpp +++ /dev/null @@ -1,37 +0,0 @@ -#include "TaskShard.h" - -#include "TaskTable.h" - -namespace DB -{ - -TaskShard::TaskShard(TaskTable & parent, const Cluster::ShardInfo & info_) - : task_table(parent) - , info(info_) -{ - list_of_split_tables_on_shard.assign(task_table.number_of_splits, DatabaseAndTableName()); -} - -UInt32 TaskShard::numberInCluster() const -{ - return info.shard_num; -} - -UInt32 TaskShard::indexInCluster() const -{ - return info.shard_num - 1; -} - -String DB::TaskShard::getDescription() const -{ - return fmt::format("N{} (having a replica {}, pull table {} of cluster {}", - numberInCluster(), getHostNameExample(), getQuotedTable(task_table.table_pull), task_table.cluster_pull_name); -} - -String DB::TaskShard::getHostNameExample() const -{ - const auto & replicas = task_table.cluster_pull->getShardsAddresses().at(indexInCluster()); - return replicas.at(0).readableString(); -} - -} diff --git a/programs/copier/TaskShard.h b/programs/copier/TaskShard.h deleted file mode 100644 index 05d652077ea..00000000000 --- a/programs/copier/TaskShard.h +++ /dev/null @@ -1,56 +0,0 @@ -#pragma once - -#include "Aliases.h" -#include "Internals.h" -#include "ClusterPartition.h" -#include "ShardPartition.h" - - -namespace DB -{ - -struct TaskTable; - -struct TaskShard -{ - TaskShard(TaskTable & parent, const Cluster::ShardInfo & info_); - - TaskTable & task_table; - - Cluster::ShardInfo info; - - UInt32 numberInCluster() const; - - UInt32 indexInCluster() const; - - String getDescription() const; - - String getHostNameExample() const; - - /// Used to sort clusters by their proximity - ShardPriority priority; - - /// Column with unique destination partitions (computed from engine_push_partition_key expr.) 
in the shard - ColumnWithTypeAndName partition_key_column; - - /// There is a task for each destination partition - TasksPartition partition_tasks; - - /// Which partitions have been checked for existence - /// If some partition from this lists is exists, it is in partition_tasks - std::set checked_partitions; - - /// Last CREATE TABLE query of the table of the shard - ASTPtr current_pull_table_create_query; - ASTPtr current_push_table_create_query; - - /// Internal distributed tables - DatabaseAndTableName table_read_shard; - DatabaseAndTableName main_table_split_shard; - ListOfDatabasesAndTableNames list_of_split_tables_on_shard; -}; - -using TaskShardPtr = std::shared_ptr; -using TasksShard = std::vector; - -} diff --git a/programs/copier/TaskTable.cpp b/programs/copier/TaskTable.cpp deleted file mode 100644 index d055ceb4c7b..00000000000 --- a/programs/copier/TaskTable.cpp +++ /dev/null @@ -1,222 +0,0 @@ -#include "TaskTable.h" - -#include "ClusterPartition.h" -#include "TaskCluster.h" - -#include -#include - -#include - - -namespace DB -{ -namespace ErrorCodes -{ - extern const int UNKNOWN_ELEMENT_IN_CONFIG; - extern const int LOGICAL_ERROR; -} - -TaskTable::TaskTable(TaskCluster & parent, const Poco::Util::AbstractConfiguration & config, - const String & prefix_, const String & table_key) - : task_cluster(parent) -{ - String table_prefix = prefix_ + "." + table_key + "."; - - name_in_config = table_key; - - number_of_splits = config.getUInt64(table_prefix + "number_of_splits", 3); - - allow_to_copy_alias_and_materialized_columns = config.getBool(table_prefix + "allow_to_copy_alias_and_materialized_columns", false); - allow_to_drop_target_partitions = config.getBool(table_prefix + "allow_to_drop_target_partitions", false); - - cluster_pull_name = config.getString(table_prefix + "cluster_pull"); - cluster_push_name = config.getString(table_prefix + "cluster_push"); - - table_pull.first = config.getString(table_prefix + "database_pull"); - table_pull.second = config.getString(table_prefix + "table_pull"); - - table_push.first = config.getString(table_prefix + "database_push"); - table_push.second = config.getString(table_prefix + "table_push"); - - /// Used as node name in ZooKeeper - table_id = escapeForFileName(cluster_push_name) - + "." + escapeForFileName(table_push.first) - + "." 
+ escapeForFileName(table_push.second); - - engine_push_str = config.getString(table_prefix + "engine", "rand()"); - - { - ParserStorage parser_storage{ParserStorage::TABLE_ENGINE}; - engine_push_ast = parseQuery(parser_storage, engine_push_str, 0, DBMS_DEFAULT_MAX_PARSER_DEPTH); - engine_push_partition_key_ast = extractPartitionKey(engine_push_ast); - primary_key_comma_separated = boost::algorithm::join(extractPrimaryKeyColumnNames(engine_push_ast), ", "); - is_replicated_table = isReplicatedTableEngine(engine_push_ast); - } - - sharding_key_str = config.getString(table_prefix + "sharding_key"); - - auxiliary_engine_split_asts.reserve(number_of_splits); - { - ParserExpressionWithOptionalAlias parser_expression(false); - sharding_key_ast = parseQuery(parser_expression, sharding_key_str, 0, DBMS_DEFAULT_MAX_PARSER_DEPTH); - main_engine_split_ast = createASTStorageDistributed(cluster_push_name, table_push.first, table_push.second, - sharding_key_ast); - - for (const auto piece_number : collections::range(0, number_of_splits)) - { - auxiliary_engine_split_asts.emplace_back - ( - createASTStorageDistributed(cluster_push_name, table_push.first, - table_push.second + "_piece_" + toString(piece_number), sharding_key_ast) - ); - } - } - - where_condition_str = config.getString(table_prefix + "where_condition", ""); - if (!where_condition_str.empty()) - { - ParserExpressionWithOptionalAlias parser_expression(false); - where_condition_ast = parseQuery(parser_expression, where_condition_str, 0, DBMS_DEFAULT_MAX_PARSER_DEPTH); - - // Will use canonical expression form - where_condition_str = queryToString(where_condition_ast); - } - - String enabled_partitions_prefix = table_prefix + "enabled_partitions"; - has_enabled_partitions = config.has(enabled_partitions_prefix); - - if (has_enabled_partitions) - { - Strings keys; - config.keys(enabled_partitions_prefix, keys); - - if (keys.empty()) - { - /// Parse list of partition from space-separated string - String partitions_str = config.getString(table_prefix + "enabled_partitions"); - boost::trim_if(partitions_str, isWhitespaceASCII); - boost::split(enabled_partitions, partitions_str, isWhitespaceASCII, boost::token_compress_on); - } - else - { - /// Parse sequence of ... - for (const String &key : keys) - { - if (!startsWith(key, "partition")) - throw Exception(ErrorCodes::UNKNOWN_ELEMENT_IN_CONFIG, "Unknown key {} in {}", key, enabled_partitions_prefix); - - enabled_partitions.emplace_back(config.getString(enabled_partitions_prefix + "." 
+ key)); - } - } - - std::copy(enabled_partitions.begin(), enabled_partitions.end(), std::inserter(enabled_partitions_set, enabled_partitions_set.begin())); - } -} - - -String TaskTable::getPartitionPath(const String & partition_name) const -{ - return task_cluster.task_zookeeper_path // root - + "/tables/" + table_id // tables/dst_cluster.merge.hits - + "/" + escapeForFileName(partition_name); // 201701 -} - -String TaskTable::getPartitionAttachIsActivePath(const String & partition_name) const -{ - return getPartitionPath(partition_name) + "/attach_active"; -} - -String TaskTable::getPartitionAttachIsDonePath(const String & partition_name) const -{ - return getPartitionPath(partition_name) + "/attach_is_done"; -} - -String TaskTable::getPartitionPiecePath(const String & partition_name, size_t piece_number) const -{ - assert(piece_number < number_of_splits); - return getPartitionPath(partition_name) + "/piece_" + toString(piece_number); // 1...number_of_splits -} - -String TaskTable::getCertainPartitionIsDirtyPath(const String &partition_name) const -{ - return getPartitionPath(partition_name) + "/is_dirty"; -} - -String TaskTable::getCertainPartitionPieceIsDirtyPath(const String & partition_name, const size_t piece_number) const -{ - return getPartitionPiecePath(partition_name, piece_number) + "/is_dirty"; -} - -String TaskTable::getCertainPartitionIsCleanedPath(const String & partition_name) const -{ - return getCertainPartitionIsDirtyPath(partition_name) + "/cleaned"; -} - -String TaskTable::getCertainPartitionPieceIsCleanedPath(const String & partition_name, const size_t piece_number) const -{ - return getCertainPartitionPieceIsDirtyPath(partition_name, piece_number) + "/cleaned"; -} - -String TaskTable::getCertainPartitionTaskStatusPath(const String & partition_name) const -{ - return getPartitionPath(partition_name) + "/shards"; -} - -String TaskTable::getCertainPartitionPieceTaskStatusPath(const String & partition_name, const size_t piece_number) const -{ - return getPartitionPiecePath(partition_name, piece_number) + "/shards"; -} - -bool TaskTable::isReplicatedTable() const -{ - return is_replicated_table; -} - -String TaskTable::getStatusAllPartitionCount() const -{ - return task_cluster.task_zookeeper_path + "/status/all_partitions_count"; -} - -String TaskTable::getStatusProcessedPartitionsCount() const -{ - return task_cluster.task_zookeeper_path + "/status/processed_partitions_count"; -} - -ASTPtr TaskTable::rewriteReplicatedCreateQueryToPlain() const -{ - ASTPtr prev_engine_push_ast = engine_push_ast->clone(); - - auto & new_storage_ast = prev_engine_push_ast->as(); - auto & new_engine_ast = new_storage_ast.engine->as(); - - /// Remove "Replicated" from name - new_engine_ast.name = new_engine_ast.name.substr(10); - - if (new_engine_ast.arguments) - { - auto & replicated_table_arguments = new_engine_ast.arguments->children; - - - /// In some cases of Atomic database engine usage ReplicatedMergeTree tables - /// could be created without arguments. - if (!replicated_table_arguments.empty()) - { - /// Delete first two arguments of Replicated...MergeTree() table. 
- replicated_table_arguments.erase(replicated_table_arguments.begin()); - replicated_table_arguments.erase(replicated_table_arguments.begin()); - } - } - - return new_storage_ast.clone(); -} - -ClusterPartition & TaskTable::getClusterPartition(const String & partition_name) -{ - auto it = cluster_partitions.find(partition_name); - if (it == cluster_partitions.end()) - throw Exception(ErrorCodes::LOGICAL_ERROR, "There are no cluster partition {} in {}", partition_name, table_id); - return it->second; -} - -} diff --git a/programs/copier/TaskTable.h b/programs/copier/TaskTable.h deleted file mode 100644 index 2bb7f078bc6..00000000000 --- a/programs/copier/TaskTable.h +++ /dev/null @@ -1,173 +0,0 @@ -#pragma once - -#include "Aliases.h" -#include "TaskShard.h" - - -namespace DB -{ - -struct ClusterPartition; -struct TaskCluster; - -struct TaskTable -{ - TaskTable(TaskCluster & parent, const Poco::Util::AbstractConfiguration & config, const String & prefix, const String & table_key); - - TaskCluster & task_cluster; - - /// These functions used in checkPartitionIsDone() or checkPartitionPieceIsDone() - /// They are implemented here not to call task_table.tasks_shard[partition_name].second.pieces[current_piece_number] etc. - - String getPartitionPath(const String & partition_name) const; - - String getPartitionAttachIsActivePath(const String & partition_name) const; - - String getPartitionAttachIsDonePath(const String & partition_name) const; - - String getPartitionPiecePath(const String & partition_name, size_t piece_number) const; - - String getCertainPartitionIsDirtyPath(const String & partition_name) const; - - String getCertainPartitionPieceIsDirtyPath(const String & partition_name, size_t piece_number) const; - - String getCertainPartitionIsCleanedPath(const String & partition_name) const; - - String getCertainPartitionPieceIsCleanedPath(const String & partition_name, size_t piece_number) const; - - String getCertainPartitionTaskStatusPath(const String & partition_name) const; - - String getCertainPartitionPieceTaskStatusPath(const String & partition_name, size_t piece_number) const; - - bool isReplicatedTable() const; - - /// These nodes are used for check-status option - String getStatusAllPartitionCount() const; - String getStatusProcessedPartitionsCount() const; - - /// Partitions will be split into number-of-splits pieces. - /// Each piece will be copied independently. 
(10 by default) - size_t number_of_splits; - - bool allow_to_copy_alias_and_materialized_columns{false}; - bool allow_to_drop_target_partitions{false}; - - String name_in_config; - - /// Used as task ID - String table_id; - - /// Column names in primary key - String primary_key_comma_separated; - - /// Source cluster and table - String cluster_pull_name; - DatabaseAndTableName table_pull; - - /// Destination cluster and table - String cluster_push_name; - DatabaseAndTableName table_push; - - /// Storage of destination table - /// (tables that are stored on each shard of target cluster) - String engine_push_str; - ASTPtr engine_push_ast; - ASTPtr engine_push_partition_key_ast; - - /// First argument of Replicated...MergeTree() - String engine_push_zk_path; - bool is_replicated_table; - - ASTPtr rewriteReplicatedCreateQueryToPlain() const; - - /* - * A Distributed table definition used to split data - * Distributed table will be created on each shard of default - * cluster to perform data copying and resharding - * */ - String sharding_key_str; - ASTPtr sharding_key_ast; - ASTPtr main_engine_split_ast; - - /* - * To copy partition piece form one cluster to another we have to use Distributed table. - * In case of usage separate table (engine_push) for each partition piece, - * we have to use many Distributed tables. - * */ - ASTs auxiliary_engine_split_asts; - - /// Additional WHERE expression to filter input data - String where_condition_str; - ASTPtr where_condition_ast; - - /// Resolved clusters - ClusterPtr cluster_pull; - ClusterPtr cluster_push; - - /// Filter partitions that should be copied - bool has_enabled_partitions = false; - Strings enabled_partitions; - NameSet enabled_partitions_set; - - /** - * Prioritized list of shards - * all_shards contains information about all shards in the table. - * So we have to check whether particular shard have current partition or not while processing. - */ - TasksShard all_shards; - TasksShard local_shards; - - /// All partitions of the current table. 
- ClusterPartitions cluster_partitions; - NameSet finished_cluster_partitions; - - /// Partition names to process in user-specified order - Strings ordered_partition_names; - - ClusterPartition & getClusterPartition(const String & partition_name); - - Stopwatch watch; - UInt64 bytes_copied = 0; - UInt64 rows_copied = 0; - - template - void initShards(RandomEngine &&random_engine); -}; - -using TasksTable = std::list; - - -template -inline void TaskTable::initShards(RandomEngine && random_engine) -{ - const String & fqdn_name = getFQDNOrHostName(); - std::uniform_int_distribution get_urand(0, std::numeric_limits::max()); - - // Compute the priority - for (const auto & shard_info : cluster_pull->getShardsInfo()) - { - TaskShardPtr task_shard = std::make_shared(*this, shard_info); - const auto & replicas = cluster_pull->getShardsAddresses().at(task_shard->indexInCluster()); - task_shard->priority = getReplicasPriority(replicas, fqdn_name, get_urand(random_engine)); - - all_shards.emplace_back(task_shard); - } - - // Sort by priority - std::sort(all_shards.begin(), all_shards.end(), - [](const TaskShardPtr & lhs, const TaskShardPtr & rhs) - { - return ShardPriority::greaterPriority(lhs->priority, rhs->priority); - }); - - // Cut local shards - auto it_first_remote = std::lower_bound(all_shards.begin(), all_shards.end(), 1, - [](const TaskShardPtr & lhs, UInt8 is_remote) - { - return lhs->priority.is_remote < is_remote; - }); - - local_shards.assign(all_shards.begin(), it_first_remote); -} - -} diff --git a/programs/copier/ZooKeeperStaff.h b/programs/copier/ZooKeeperStaff.h deleted file mode 100644 index c15db73f060..00000000000 --- a/programs/copier/ZooKeeperStaff.h +++ /dev/null @@ -1,221 +0,0 @@ -#pragma once - -/** Allows to compare two incremental counters of type UInt32 in presence of possible overflow. - * We assume that we compare values that are not too far away. - * For example, when we increment 0xFFFFFFFF, we get 0. So, 0xFFFFFFFF is less than 0. - */ -class WrappingUInt32 -{ -public: - UInt32 value; - - explicit WrappingUInt32(UInt32 _value) - : value(_value) - {} - - bool operator<(const WrappingUInt32 & other) const - { - return value != other.value && *this <= other; - } - - bool operator<=(const WrappingUInt32 & other) const - { - const UInt32 HALF = static_cast(1) << 31; - return (value <= other.value && other.value - value < HALF) - || (value > other.value && value - other.value > HALF); - } - - bool operator==(const WrappingUInt32 & other) const - { - return value == other.value; - } -}; - -/** Conforming Zxid definition. - * cf. https://github.com/apache/zookeeper/blob/631d1b284f0edb1c4f6b0fb221bf2428aec71aaa/zookeeper-docs/src/main/resources/markdown/zookeeperInternals.md#guarantees-properties-and-definitions - * - * But it is better to read this: https://zookeeper.apache.org/doc/r3.1.2/zookeeperProgrammers.html - * - * Actually here is the definition of Zxid. - * Every change to the ZooKeeper state receives a stamp in the form of a zxid (ZooKeeper Transaction Id). - * This exposes the total ordering of all changes to ZooKeeper. Each change will have a unique zxid - * and if zxid1 is smaller than zxid2 then zxid1 happened before zxid2. 
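A minimal standalone C++ sketch of the wrap-around rule that WrappingUInt32 above encodes, restated on plain unsigned integers; the helper name and sample values are illustrative only, and the assumption is the same as in the comment: the two counters are never more than 2^31 apart.

#include <cassert>
#include <cstdint>

/// True if a "is less than or equal to" b under wrap-around (modulo 2^32) semantics.
static bool wrappingLessOrEqual(std::uint32_t a, std::uint32_t b)
{
    const std::uint32_t HALF = 1u << 31;
    return (a <= b && b - a < HALF) || (a > b && a - b > HALF);
}

int main()
{
    /// Incrementing 0xFFFFFFFF overflows to 0, so 0xFFFFFFFF is treated as less than 0.
    assert(wrappingLessOrEqual(0xFFFFFFFFu, 0u));
    assert(!wrappingLessOrEqual(0u, 0xFFFFFFFFu));
    /// Nearby values that do not cross the overflow point compare as usual.
    assert(wrappingLessOrEqual(5u, 6u));
    return 0;
}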
- */ -class Zxid -{ -public: - WrappingUInt32 epoch; - WrappingUInt32 counter; - explicit Zxid(UInt64 _zxid) - : epoch(static_cast(_zxid >> 32)) - , counter(static_cast(_zxid)) - {} - - bool operator<=(const Zxid & other) const - { - return (epoch < other.epoch) - || (epoch == other.epoch && counter <= other.counter); - } - - bool operator==(const Zxid & other) const - { - return epoch == other.epoch && counter == other.counter; - } -}; - -/* When multiple ClusterCopiers discover that the target partition is not empty, - * they will attempt to clean up this partition before proceeding to copying. - * - * Instead of purging is_dirty, the history of cleaning work is preserved and partition hygiene is established - * based on a happens-before relation between the events. - * This relation is encoded by LogicalClock based on the mzxid of the is_dirty ZNode and is_dirty/cleaned. - * The fact of the partition hygiene is encoded by CleanStateClock. - * - * For you to know what mzxid means: - * - * ZooKeeper Stat Structure: - * The Stat structure for each znode in ZooKeeper is made up of the following fields: - * - * -- czxid - * The zxid of the change that caused this znode to be created. - * - * -- mzxid - * The zxid of the change that last modified this znode. - * - * -- ctime - * The time in milliseconds from epoch when this znode was created. - * - * -- mtime - * The time in milliseconds from epoch when this znode was last modified. - * - * -- version - * The number of changes to the data of this znode. - * - * -- cversion - * The number of changes to the children of this znode. - * - * -- aversion - * The number of changes to the ACL of this znode. - * - * -- ephemeralOwner - * The session id of the owner of this znode if the znode is an ephemeral node. - * If it is not an ephemeral node, it will be zero. - * - * -- dataLength - * The length of the data field of this znode. - * - * -- numChildren - * The number of children of this znode. 
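A minimal standalone C++ model of the happens-before rule this comment describes and that LogicalClock below implements; std::optional<std::uint64_t> stands in for the Zxid type, and the sample mzxid values are made up for illustration.

#include <cassert>
#include <cstdint>
#include <optional>

/// "No event observed" happens before anything; otherwise compare transaction ids.
static bool happensBefore(const std::optional<std::uint64_t> & lhs, const std::optional<std::uint64_t> & rhs)
{
    return !lhs || (rhs && *lhs <= *rhs);
}

int main()
{
    std::optional<std::uint64_t> discovery = 100;   /// e.g. mzxid of the is_dirty node
    std::optional<std::uint64_t> cleaned   = 150;   /// e.g. mzxid of is_dirty/cleaned

    /// The partition counts as clean when the discovery event happens before the cleaning event.
    assert(happensBefore(discovery, cleaned));
    assert(!happensBefore(cleaned, discovery));
    assert(happensBefore(std::nullopt, discovery));
    return 0;
}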
- * */ - -class LogicalClock -{ -public: - std::optional zxid; - - LogicalClock() = default; - - explicit LogicalClock(UInt64 _zxid) - : zxid(_zxid) - {} - - bool hasHappened() const - { - return bool(zxid); - } - - /// happens-before relation with a reasonable time bound - bool happensBefore(const LogicalClock & other) const - { - return !zxid - || (other.zxid && *zxid <= *other.zxid); - } - - bool operator<=(const LogicalClock & other) const - { - return happensBefore(other); - } - - /// strict equality check - bool operator==(const LogicalClock & other) const - { - return zxid == other.zxid; - } -}; - - -class CleanStateClock -{ -public: - LogicalClock discovery_zxid; - std::optional discovery_version; - - LogicalClock clean_state_zxid; - std::optional clean_state_version; - - std::shared_ptr stale; - - bool is_clean() const - { - return !is_stale() - && (!discovery_zxid.hasHappened() || (clean_state_zxid.hasHappened() && discovery_zxid <= clean_state_zxid)); - } - - bool is_stale() const - { - return stale->load(); - } - - CleanStateClock( - const zkutil::ZooKeeperPtr & zookeeper, - const String & discovery_path, - const String & clean_state_path) - : stale(std::make_shared(false)) - { - Coordination::Stat stat{}; - String _some_data; - auto watch_callback = - [my_stale = stale] (const Coordination::WatchResponse & rsp) - { - auto logger = getLogger("ClusterCopier"); - if (rsp.error == Coordination::Error::ZOK) - { - switch (rsp.type) /// NOLINT(bugprone-switch-missing-default-case) - { - case Coordination::CREATED: - LOG_DEBUG(logger, "CleanStateClock change: CREATED, at {}", rsp.path); - my_stale->store(true); - break; - case Coordination::CHANGED: - LOG_DEBUG(logger, "CleanStateClock change: CHANGED, at {}", rsp.path); - my_stale->store(true); - } - } - }; - if (zookeeper->tryGetWatch(discovery_path, _some_data, &stat, watch_callback)) - { - discovery_zxid = LogicalClock(stat.mzxid); - discovery_version = stat.version; - } - if (zookeeper->tryGetWatch(clean_state_path, _some_data, &stat, watch_callback)) - { - clean_state_zxid = LogicalClock(stat.mzxid); - clean_state_version = stat.version; - } - } - - bool operator==(const CleanStateClock & other) const - { - return !is_stale() - && !other.is_stale() - && discovery_zxid == other.discovery_zxid - && discovery_version == other.discovery_version - && clean_state_zxid == other.clean_state_zxid - && clean_state_version == other.clean_state_version; - } - - bool operator!=(const CleanStateClock & other) const - { - return !(*this == other); - } -}; diff --git a/programs/copier/clickhouse-copier.cpp b/programs/copier/clickhouse-copier.cpp deleted file mode 100644 index 4dabb01775b..00000000000 --- a/programs/copier/clickhouse-copier.cpp +++ /dev/null @@ -1 +0,0 @@ -int mainEntryClickHouseClusterCopier(int argc, char ** argv); diff --git a/programs/diagnostics/testdata/configs/xml/config.xml b/programs/diagnostics/testdata/configs/xml/config.xml index ae09d207091..eb7c70cf498 100644 --- a/programs/diagnostics/testdata/configs/xml/config.xml +++ b/programs/diagnostics/testdata/configs/xml/config.xml @@ -94,7 +94,7 @@ 8123 - - - system -
query_log
- - - 1000 - - \ No newline at end of file diff --git a/tests/integration/test_cluster_copier/configs/config-copier.xml b/tests/integration/test_cluster_copier/configs/config-copier.xml deleted file mode 100644 index 590b1892f8d..00000000000 --- a/tests/integration/test_cluster_copier/configs/config-copier.xml +++ /dev/null @@ -1,11 +0,0 @@ - - - information - /var/log/clickhouse-server/copier/log.log - /var/log/clickhouse-server/copier/log.err.log - 1000M - 10 - /var/log/clickhouse-server/copier/stderr.log - /var/log/clickhouse-server/copier/stdout.log - - diff --git a/tests/integration/test_cluster_copier/configs/users.xml b/tests/integration/test_cluster_copier/configs/users.xml deleted file mode 100644 index b463dfc81e7..00000000000 --- a/tests/integration/test_cluster_copier/configs/users.xml +++ /dev/null @@ -1,34 +0,0 @@ - - - - 1 - - 5 - 1 - - - - - - - - ::/0 - - default - default - - - 12345678 - - ::/0 - - default - default - - - - - - - - diff --git a/tests/integration/test_cluster_copier/configs_three_nodes/conf.d/clusters.xml b/tests/integration/test_cluster_copier/configs_three_nodes/conf.d/clusters.xml deleted file mode 100644 index 9de7b57de27..00000000000 --- a/tests/integration/test_cluster_copier/configs_three_nodes/conf.d/clusters.xml +++ /dev/null @@ -1,27 +0,0 @@ - - - - - false - - first - 9000 - - - - false - - second - 9000 - - - - false - - third - 9000 - - - - - diff --git a/tests/integration/test_cluster_copier/configs_three_nodes/conf.d/ddl.xml b/tests/integration/test_cluster_copier/configs_three_nodes/conf.d/ddl.xml deleted file mode 100644 index 64fa32335ab..00000000000 --- a/tests/integration/test_cluster_copier/configs_three_nodes/conf.d/ddl.xml +++ /dev/null @@ -1,5 +0,0 @@ - - - /clickhouse/task_queue/ddl - - \ No newline at end of file diff --git a/tests/integration/test_cluster_copier/configs_three_nodes/config-copier.xml b/tests/integration/test_cluster_copier/configs_three_nodes/config-copier.xml deleted file mode 100644 index d0cab0fafb7..00000000000 --- a/tests/integration/test_cluster_copier/configs_three_nodes/config-copier.xml +++ /dev/null @@ -1,27 +0,0 @@ - - - information - /var/log/clickhouse-server/copier/log.log - /var/log/clickhouse-server/copier/log.err.log - 1000M - 10 - /var/log/clickhouse-server/copier/stderr.log - /var/log/clickhouse-server/copier/stdout.log - - - - - zoo1 - 2181 - - - zoo2 - 2181 - - - zoo3 - 2181 - - 2000 - - diff --git a/tests/integration/test_cluster_copier/configs_three_nodes/users.xml b/tests/integration/test_cluster_copier/configs_three_nodes/users.xml deleted file mode 100644 index badaf46a5ca..00000000000 --- a/tests/integration/test_cluster_copier/configs_three_nodes/users.xml +++ /dev/null @@ -1,32 +0,0 @@ - - - - 1 - 1 - - - - - - - - ::/0 - - default - default - - - 12345678 - - ::/0 - - default - default - - - - - - - - diff --git a/tests/integration/test_cluster_copier/configs_two_nodes/conf.d/clusters.xml b/tests/integration/test_cluster_copier/configs_two_nodes/conf.d/clusters.xml deleted file mode 100644 index 38d88308631..00000000000 --- a/tests/integration/test_cluster_copier/configs_two_nodes/conf.d/clusters.xml +++ /dev/null @@ -1,22 +0,0 @@ - - - - - false - - first_of_two - 9000 - - - - - - false - - second_of_two - 9000 - - - - - diff --git a/tests/integration/test_cluster_copier/configs_two_nodes/conf.d/ddl.xml b/tests/integration/test_cluster_copier/configs_two_nodes/conf.d/ddl.xml deleted file mode 100644 index 64fa32335ab..00000000000 --- 
a/tests/integration/test_cluster_copier/configs_two_nodes/conf.d/ddl.xml +++ /dev/null @@ -1,5 +0,0 @@ - - - /clickhouse/task_queue/ddl - - \ No newline at end of file diff --git a/tests/integration/test_cluster_copier/configs_two_nodes/conf.d/storage_configuration.xml b/tests/integration/test_cluster_copier/configs_two_nodes/conf.d/storage_configuration.xml deleted file mode 100644 index 8306f40ad6a..00000000000 --- a/tests/integration/test_cluster_copier/configs_two_nodes/conf.d/storage_configuration.xml +++ /dev/null @@ -1,34 +0,0 @@ - - - - - - - - /jbod1/ - - - /jbod2/ - - - /external/ - - - - - - - - external - -
- jbod1 - jbod2 -
-
-
-
- -
- -
diff --git a/tests/integration/test_cluster_copier/configs_two_nodes/config-copier.xml b/tests/integration/test_cluster_copier/configs_two_nodes/config-copier.xml deleted file mode 100644 index 55bd24816ae..00000000000 --- a/tests/integration/test_cluster_copier/configs_two_nodes/config-copier.xml +++ /dev/null @@ -1,19 +0,0 @@ - - - information - /var/log/clickhouse-server/copier/log.log - /var/log/clickhouse-server/copier/log.err.log - 1000M - 10 - /var/log/clickhouse-server/copier/stderr.log - /var/log/clickhouse-server/copier/stdout.log - - - - - zoo1 - 2181 - - 2000 - - diff --git a/tests/integration/test_cluster_copier/configs_two_nodes/users.xml b/tests/integration/test_cluster_copier/configs_two_nodes/users.xml deleted file mode 100644 index badaf46a5ca..00000000000 --- a/tests/integration/test_cluster_copier/configs_two_nodes/users.xml +++ /dev/null @@ -1,32 +0,0 @@ - - - - 1 - 1 - - - - - - - - ::/0 - - default - default - - - 12345678 - - ::/0 - - default - default - - - - - - - - diff --git a/tests/integration/test_cluster_copier/task0_description.xml b/tests/integration/test_cluster_copier/task0_description.xml deleted file mode 100644 index 8d74d0bdde0..00000000000 --- a/tests/integration/test_cluster_copier/task0_description.xml +++ /dev/null @@ -1,95 +0,0 @@ - - - 3 - - - - 1 - - - - - 0 - - - - - - - - - - cluster0 - default - hits - - cluster1 - default - hits - - 2 - - 3 4 5 6 1 2 0 - - - ENGINE=ReplicatedMergeTree PARTITION BY d % 3 ORDER BY (d, sipHash64(d)) SAMPLE BY sipHash64(d) SETTINGS index_granularity = 16 - - - d + 1 - - - d - d = 0 - - - - - - - - true - - s0_0_0 - 9000 - - - s0_0_1 - 9000 - - - - true - - s0_1_0 - 9000 - - - - - - - true - - s1_0_0 - 9000 - - - s1_0_1 - 9000 - - - - true - - s1_1_0 - 9000 - - - - 255.255.255.255 - 9000 - - - - - - diff --git a/tests/integration/test_cluster_copier/task_drop_target_partition.xml b/tests/integration/test_cluster_copier/task_drop_target_partition.xml deleted file mode 100644 index dc8e6452243..00000000000 --- a/tests/integration/test_cluster_copier/task_drop_target_partition.xml +++ /dev/null @@ -1,41 +0,0 @@ - - - - - false - - first_of_two - 9000 - - - - - - false - - second_of_two - 9000 - - - - - - 2 - - - - source - db_drop_target_partition - source - - destination - db_drop_target_partition - destination - - true - - ENGINE = MergeTree() PARTITION BY toYYYYMMDD(Column3) ORDER BY (Column3, Column2, Column1) - rand() - - - diff --git a/tests/integration/test_cluster_copier/task_month_to_week_description.xml b/tests/integration/test_cluster_copier/task_month_to_week_description.xml deleted file mode 100644 index bc290ca397f..00000000000 --- a/tests/integration/test_cluster_copier/task_month_to_week_description.xml +++ /dev/null @@ -1,99 +0,0 @@ - - - 4 - - - - 1 - 2 - - - - 0 - - - - - - cluster0 - default - a - - cluster1 - default - b - - - - 2 - - - ENGINE= - ReplicatedMergeTree - PARTITION BY toMonday(date) - ORDER BY d - - - - jumpConsistentHash(intHash64(d), 2) - - - - - - - - - - - true - - s0_0_0 - 9000 - - - s0_0_1 - 9000 - - - - true - - s0_1_0 - 9000 - - - - - - - true - - s1_0_0 - 9000 - - - s1_0_1 - 9000 - - - - true - - s1_1_0 - 9000 - - - - 255.255.255.255 - 9000 - - - - - - diff --git a/tests/integration/test_cluster_copier/task_no_arg.xml b/tests/integration/test_cluster_copier/task_no_arg.xml deleted file mode 100644 index 262ff073537..00000000000 --- a/tests/integration/test_cluster_copier/task_no_arg.xml +++ /dev/null @@ -1,39 +0,0 @@ - - - - - 1 - - s0_0_0 - 9000 - - - - - - - 1 - - s1_1_0 
- 9000 - - - - - - 1 - - - - source_cluster - default - copier_test1 - - default_cluster - default - copier_test1_1 - ENGINE = MergeTree PARTITION BY date ORDER BY (date, sipHash64(date)) SAMPLE BY sipHash64(date) - rand() - - - diff --git a/tests/integration/test_cluster_copier/task_no_index.xml b/tests/integration/test_cluster_copier/task_no_index.xml deleted file mode 100644 index 265f99e21a6..00000000000 --- a/tests/integration/test_cluster_copier/task_no_index.xml +++ /dev/null @@ -1,109 +0,0 @@ - - - - - false - - s0_0_0 - 9000 - - - - - - - false - - s1_1_0 - 9000 - - - - - - - 2 - - - - 1 - - - - - 0 - - - - - 3 - - 1 - - - - - - - - source_cluster - default - ontime - - - - destination_cluster - default - ontime22 - - - - - - - ENGINE = MergeTree() PARTITION BY Year ORDER BY (Year, FlightDate) SETTINGS index_granularity=8192 - - - - - jumpConsistentHash(intHash64(Year), 2) - - - - - - - 2017 - - - - - - - diff --git a/tests/integration/test_cluster_copier/task_non_partitioned_table.xml b/tests/integration/test_cluster_copier/task_non_partitioned_table.xml deleted file mode 100644 index d5424b95f45..00000000000 --- a/tests/integration/test_cluster_copier/task_non_partitioned_table.xml +++ /dev/null @@ -1,39 +0,0 @@ - - - - - 1 - - s0_0_0 - 9000 - - - - - - - 1 - - s1_1_0 - 9000 - - - - - - 1 - - - - source_cluster - default - copier_test1 - - default_cluster - default - copier_test1_1 - ENGINE = MergeTree ORDER BY date SETTINGS index_granularity = 8192 - rand() - - - diff --git a/tests/integration/test_cluster_copier/task_self_copy.xml b/tests/integration/test_cluster_copier/task_self_copy.xml deleted file mode 100644 index 21d577bc397..00000000000 --- a/tests/integration/test_cluster_copier/task_self_copy.xml +++ /dev/null @@ -1,63 +0,0 @@ - - 9440 - - - - false - - s0_0_0 - 9000 - dbuser - 12345678 - 0 - - - - - - - false - - s0_0_0 - 9000 - dbuser - 12345678 - 0 - - - - - - 2 - - - 1 - - - - 0 - - - - 3 - 1 - - - - - source_cluster - db1 - source_table - - destination_cluster - db2 - destination_table - - - ENGINE = MergeTree PARTITION BY a ORDER BY a SETTINGS index_granularity = 8192 - - - rand() - - - \ No newline at end of file diff --git a/tests/integration/test_cluster_copier/task_skip_index.xml b/tests/integration/test_cluster_copier/task_skip_index.xml deleted file mode 100644 index b04cec963d4..00000000000 --- a/tests/integration/test_cluster_copier/task_skip_index.xml +++ /dev/null @@ -1,39 +0,0 @@ - - - - - false - - first_of_two - 9000 - - - - - - false - - second_of_two - 9000 - - - - - - 2 - - - - source - db_skip_index - source - - destination - db_skip_index - destination - - ENGINE = MergeTree() PARTITION BY toYYYYMMDD(Column3) ORDER BY (Column3, Column2, Column1) - rand() - - - diff --git a/tests/integration/test_cluster_copier/task_taxi_data.xml b/tests/integration/test_cluster_copier/task_taxi_data.xml deleted file mode 100644 index 94fa5087338..00000000000 --- a/tests/integration/test_cluster_copier/task_taxi_data.xml +++ /dev/null @@ -1,42 +0,0 @@ - - - - - false - - first - 9000 - - - - false - - second - 9000 - - - - false - - third - 9000 - - - - - - 2 - - - - events - dailyhistory - yellow_tripdata_staging - events - monthlyhistory - yellow_tripdata_staging - Engine=ReplacingMergeTree() PRIMARY KEY (tpep_pickup_datetime, id) ORDER BY (tpep_pickup_datetime, id) PARTITION BY (pickup_location_id, toYYYYMM(tpep_pickup_datetime)) - sipHash64(id) % 3 - - - \ No newline at end of file diff --git a/tests/integration/test_cluster_copier/task_test_block_size.xml 
b/tests/integration/test_cluster_copier/task_test_block_size.xml deleted file mode 100644 index bf29c7e1832..00000000000 --- a/tests/integration/test_cluster_copier/task_test_block_size.xml +++ /dev/null @@ -1,101 +0,0 @@ - - - 1 - - - - 1 - - - - - - - - - shard_0_0 - default - test_block_size - - cluster1 - default - test_block_size - - - '1970-01-01' - - - - ENGINE= - ReplicatedMergeTree - ORDER BY d PARTITION BY partition - - - - jumpConsistentHash(intHash64(d), 2) - - - - - - - - - - - true - - s0_0_0 - 9000 - - - s0_0_1 - 9000 - - - - true - - s0_1_0 - 9000 - - - - - - - true - - s1_0_0 - 9000 - - - s1_0_1 - 9000 - - - - true - - s1_1_0 - 9000 - - - - - - - true - - s0_0_0 - 9000 - - - s0_0_1 - 9000 - - - - - - diff --git a/tests/integration/test_cluster_copier/task_trivial.xml b/tests/integration/test_cluster_copier/task_trivial.xml deleted file mode 100644 index a3b8bc03888..00000000000 --- a/tests/integration/test_cluster_copier/task_trivial.xml +++ /dev/null @@ -1,63 +0,0 @@ - - - 3 - - - - 1 - - - - - 0 - - - - - - - - - - source_trivial_cluster - default - trivial - - destination_trivial_cluster - default - trivial - - - ENGINE=ReplicatedMergeTree('/clickhouse/tables/cluster{cluster}/{shard}/hits', '{replica}') PARTITION BY d % 5 ORDER BY (d, sipHash64(d)) SAMPLE BY sipHash64(d) SETTINGS index_granularity = 16 - - - d + 1 - - - d - d = 0 - - - - - - - - - first_trivial - 9000 - - - - - - - - - second_trivial - 9000 - - - - - - diff --git a/tests/integration/test_cluster_copier/task_trivial_without_arguments.xml b/tests/integration/test_cluster_copier/task_trivial_without_arguments.xml deleted file mode 100644 index 0197dee0181..00000000000 --- a/tests/integration/test_cluster_copier/task_trivial_without_arguments.xml +++ /dev/null @@ -1,63 +0,0 @@ - - - 3 - - - - 1 - - - - - 0 - - - - - - - - - - source_trivial_cluster - default - trivial_without_arguments - - destination_trivial_cluster - default - trivial_without_arguments - - - ENGINE=ReplicatedMergeTree() PARTITION BY d % 5 ORDER BY (d, sipHash64(d)) SAMPLE BY sipHash64(d) SETTINGS index_granularity = 16 - - - d + 1 - - - d - d = 0 - - - - - - - - - first_trivial - 9000 - - - - - - - - - second_trivial - 9000 - - - - - - diff --git a/tests/integration/test_cluster_copier/task_ttl_columns.xml b/tests/integration/test_cluster_copier/task_ttl_columns.xml deleted file mode 100644 index 2069c509c87..00000000000 --- a/tests/integration/test_cluster_copier/task_ttl_columns.xml +++ /dev/null @@ -1,39 +0,0 @@ - - - - - false - - first_of_two - 9000 - - - - - - false - - second_of_two - 9000 - - - - - - 2 - - - - source - db_ttl_columns - source - - destination - db_ttl_columns - destination - - ENGINE = MergeTree() PARTITION BY toYYYYMMDD(Column3) ORDER BY (Column3, Column2, Column1) - rand() - - - diff --git a/tests/integration/test_cluster_copier/task_ttl_move_to_volume.xml b/tests/integration/test_cluster_copier/task_ttl_move_to_volume.xml deleted file mode 100644 index 2a51fa7a66d..00000000000 --- a/tests/integration/test_cluster_copier/task_ttl_move_to_volume.xml +++ /dev/null @@ -1,39 +0,0 @@ - - - - - false - - first_of_two - 9000 - - - - - - false - - second_of_two - 9000 - - - - - - 2 - - - - source - db_move_to_volume - source - - destination - db_move_to_volume - destination - - ENGINE = MergeTree() PARTITION BY toYYYYMMDD(Column3) ORDER BY (Column3, Column2, Column1) TTL Column3 + INTERVAL 1 MONTH TO VOLUME 'external' SETTINGS storage_policy = 'external_with_jbods' - rand() - - - diff --git 
a/tests/integration/test_cluster_copier/task_with_different_schema.xml b/tests/integration/test_cluster_copier/task_with_different_schema.xml deleted file mode 100644 index e1e6ee4dc42..00000000000 --- a/tests/integration/test_cluster_copier/task_with_different_schema.xml +++ /dev/null @@ -1,39 +0,0 @@ - - - - - false - - first_of_two - 9000 - - - - - - false - - second_of_two - 9000 - - - - - - 2 - - - - source - db_different_schema - source - - destination - db_different_schema - destination - - ENGINE = MergeTree() PARTITION BY toYYYYMMDD(Column3) ORDER BY (Column9, Column1, Column2, Column3, Column4) - rand() - - - diff --git a/tests/integration/test_cluster_copier/test.py b/tests/integration/test_cluster_copier/test.py deleted file mode 100644 index be71fc21e33..00000000000 --- a/tests/integration/test_cluster_copier/test.py +++ /dev/null @@ -1,653 +0,0 @@ -import os -import random -import sys -import time -import kazoo -import pytest -import string -import random -from contextlib import contextmanager -from helpers.cluster import ClickHouseCluster -from helpers.test_tools import TSV - -import docker - -CURRENT_TEST_DIR = os.path.dirname(os.path.abspath(__file__)) -sys.path.insert(0, os.path.dirname(CURRENT_TEST_DIR)) - -COPYING_FAIL_PROBABILITY = 0.2 -MOVING_FAIL_PROBABILITY = 0.2 - -cluster = ClickHouseCluster(__file__) - - -def generateRandomString(count): - return "".join( - random.choice(string.ascii_uppercase + string.digits) for _ in range(count) - ) - - -def check_all_hosts_sucesfully_executed(tsv_content, num_hosts): - M = TSV.toMat(tsv_content) - hosts = [(l[0], l[1]) for l in M] # (host, port) - codes = [l[2] for l in M] - - assert len(hosts) == num_hosts and len(set(hosts)) == num_hosts, "\n" + tsv_content - assert len(set(codes)) == 1, "\n" + tsv_content - assert codes[0] == "0", "\n" + tsv_content - - -def ddl_check_query(instance, query, num_hosts=3): - contents = instance.query(query) - check_all_hosts_sucesfully_executed(contents, num_hosts) - return contents - - -@pytest.fixture(scope="module") -def started_cluster(): - global cluster - try: - clusters_schema = { - "0": {"0": ["0", "1"], "1": ["0"]}, - "1": {"0": ["0", "1"], "1": ["0"]}, - } - - for cluster_name, shards in clusters_schema.items(): - for shard_name, replicas in shards.items(): - for replica_name in replicas: - name = "s{}_{}_{}".format(cluster_name, shard_name, replica_name) - cluster.add_instance( - name, - main_configs=[ - "configs/conf.d/query_log.xml", - "configs/conf.d/ddl.xml", - "configs/conf.d/clusters.xml", - ], - user_configs=["configs/users.xml"], - macros={ - "cluster": cluster_name, - "shard": shard_name, - "replica": replica_name, - }, - with_zookeeper=True, - ) - - cluster.start() - yield cluster - - finally: - cluster.shutdown() - - -class Task1: - def __init__(self, cluster): - self.cluster = cluster - self.zk_task_path = "/clickhouse-copier/task_simple_" + generateRandomString(10) - self.container_task_file = "/task0_description.xml" - - for instance_name, _ in cluster.instances.items(): - instance = cluster.instances[instance_name] - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "./task0_description.xml"), - self.container_task_file, - ) - print( - "Copied task file to container of '{}' instance. 
Path {}".format( - instance_name, self.container_task_file - ) - ) - - def start(self): - instance = cluster.instances["s0_0_0"] - - for cluster_num in ["0", "1"]: - ddl_check_query( - instance, - "DROP DATABASE IF EXISTS default ON CLUSTER cluster{} SYNC".format( - cluster_num - ), - ) - ddl_check_query( - instance, - "CREATE DATABASE default ON CLUSTER cluster{} ".format(cluster_num), - ) - - ddl_check_query( - instance, - "CREATE TABLE hits ON CLUSTER cluster0 (d UInt64, d1 UInt64 MATERIALIZED d+1) " - + "ENGINE=ReplicatedMergeTree " - + "PARTITION BY d % 3 ORDER BY (d, sipHash64(d)) SAMPLE BY sipHash64(d) SETTINGS index_granularity = 16", - ) - ddl_check_query( - instance, - "CREATE TABLE hits_all ON CLUSTER cluster0 (d UInt64) ENGINE=Distributed(cluster0, default, hits, d)", - ) - ddl_check_query( - instance, - "CREATE TABLE hits_all ON CLUSTER cluster1 (d UInt64) ENGINE=Distributed(cluster1, default, hits, d + 1)", - ) - instance.query( - "INSERT INTO hits_all SELECT * FROM system.numbers LIMIT 1002", - settings={"distributed_foreground_insert": 1}, - ) - - def check(self): - assert ( - self.cluster.instances["s0_0_0"] - .query("SELECT count() FROM hits_all") - .strip() - == "1002" - ) - assert ( - self.cluster.instances["s1_0_0"] - .query("SELECT count() FROM hits_all") - .strip() - == "1002" - ) - - assert ( - self.cluster.instances["s1_0_0"] - .query("SELECT DISTINCT d % 2 FROM hits") - .strip() - == "1" - ) - assert ( - self.cluster.instances["s1_1_0"] - .query("SELECT DISTINCT d % 2 FROM hits") - .strip() - == "0" - ) - - instance = self.cluster.instances["s0_0_0"] - ddl_check_query(instance, "DROP TABLE hits_all ON CLUSTER cluster0") - ddl_check_query(instance, "DROP TABLE hits_all ON CLUSTER cluster1") - ddl_check_query(instance, "DROP TABLE hits ON CLUSTER cluster0") - ddl_check_query(instance, "DROP TABLE hits ON CLUSTER cluster1") - - -class Task2: - def __init__(self, cluster, unique_zk_path): - self.cluster = cluster - self.zk_task_path = ( - "/clickhouse-copier/task_month_to_week_partition_" + generateRandomString(5) - ) - self.unique_zk_path = generateRandomString(10) - self.container_task_file = "/task_month_to_week_description.xml" - - for instance_name, _ in cluster.instances.items(): - instance = cluster.instances[instance_name] - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "./task_month_to_week_description.xml"), - self.container_task_file, - ) - print( - "Copied task file to container of '{}' instance. 
Path {}".format( - instance_name, self.container_task_file - ) - ) - - def start(self): - instance = cluster.instances["s0_0_0"] - - for cluster_num in ["0", "1"]: - ddl_check_query( - instance, - "DROP DATABASE IF EXISTS default ON CLUSTER cluster{}".format( - cluster_num - ), - ) - ddl_check_query( - instance, - "CREATE DATABASE IF NOT EXISTS default ON CLUSTER cluster{}".format( - cluster_num - ), - ) - - ddl_check_query( - instance, - "CREATE TABLE a ON CLUSTER cluster0 (date Date, d UInt64, d1 UInt64 ALIAS d+1) " - "ENGINE=ReplicatedMergeTree('/clickhouse/tables/cluster_{cluster}/{shard}/" - + self.unique_zk_path - + "', " - "'{replica}', date, intHash64(d), (date, intHash64(d)), 8192)", - ) - ddl_check_query( - instance, - "CREATE TABLE a_all ON CLUSTER cluster0 (date Date, d UInt64) ENGINE=Distributed(cluster0, default, a, d)", - ) - - instance.query( - "INSERT INTO a_all SELECT toDate(17581 + number) AS date, number AS d FROM system.numbers LIMIT 85", - settings={"distributed_foreground_insert": 1}, - ) - - def check(self): - assert TSV( - self.cluster.instances["s0_0_0"].query( - "SELECT count() FROM cluster(cluster0, default, a)" - ) - ) == TSV("85\n") - assert TSV( - self.cluster.instances["s1_0_0"].query( - "SELECT count(), uniqExact(date) FROM cluster(cluster1, default, b)" - ) - ) == TSV("85\t85\n") - - assert TSV( - self.cluster.instances["s1_0_0"].query( - "SELECT DISTINCT jumpConsistentHash(intHash64(d), 2) FROM b" - ) - ) == TSV("0\n") - assert TSV( - self.cluster.instances["s1_1_0"].query( - "SELECT DISTINCT jumpConsistentHash(intHash64(d), 2) FROM b" - ) - ) == TSV("1\n") - - assert TSV( - self.cluster.instances["s1_0_0"].query( - "SELECT uniqExact(partition) IN (12, 13) FROM system.parts WHERE active AND database='default' AND table='b'" - ) - ) == TSV("1\n") - assert TSV( - self.cluster.instances["s1_1_0"].query( - "SELECT uniqExact(partition) IN (12, 13) FROM system.parts WHERE active AND database='default' AND table='b'" - ) - ) == TSV("1\n") - - instance = cluster.instances["s0_0_0"] - ddl_check_query(instance, "DROP TABLE a ON CLUSTER cluster0") - ddl_check_query(instance, "DROP TABLE b ON CLUSTER cluster1") - - -class Task_test_block_size: - def __init__(self, cluster): - self.cluster = cluster - self.zk_task_path = ( - "/clickhouse-copier/task_test_block_size_" + generateRandomString(5) - ) - self.rows = 1000000 - self.container_task_file = "/task_test_block_size.xml" - - for instance_name, _ in cluster.instances.items(): - instance = cluster.instances[instance_name] - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "./task_test_block_size.xml"), - self.container_task_file, - ) - print( - "Copied task file to container of '{}' instance. 
Path {}".format( - instance_name, self.container_task_file - ) - ) - - def start(self): - instance = cluster.instances["s0_0_0"] - - ddl_check_query( - instance, - """ - CREATE TABLE test_block_size ON CLUSTER shard_0_0 (partition Date, d UInt64) - ENGINE=ReplicatedMergeTree - ORDER BY (d, sipHash64(d)) SAMPLE BY sipHash64(d)""", - 2, - ) - - instance.query( - "INSERT INTO test_block_size SELECT toDate(0) AS partition, number as d FROM system.numbers LIMIT {}".format( - self.rows - ) - ) - - def check(self): - assert TSV( - self.cluster.instances["s1_0_0"].query( - "SELECT count() FROM cluster(cluster1, default, test_block_size)" - ) - ) == TSV("{}\n".format(self.rows)) - - instance = cluster.instances["s0_0_0"] - ddl_check_query(instance, "DROP TABLE test_block_size ON CLUSTER shard_0_0", 2) - ddl_check_query(instance, "DROP TABLE test_block_size ON CLUSTER cluster1") - - -class Task_no_index: - def __init__(self, cluster): - self.cluster = cluster - self.zk_task_path = "/clickhouse-copier/task_no_index_" + generateRandomString( - 5 - ) - self.rows = 1000000 - self.container_task_file = "/task_no_index.xml" - - for instance_name, _ in cluster.instances.items(): - instance = cluster.instances[instance_name] - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "./task_no_index.xml"), - self.container_task_file, - ) - print( - "Copied task file to container of '{}' instance. Path {}".format( - instance_name, self.container_task_file - ) - ) - - def start(self): - instance = cluster.instances["s0_0_0"] - instance.query("DROP TABLE IF EXISTS ontime SYNC") - instance.query( - "create table IF NOT EXISTS ontime (Year UInt16, FlightDate String) ENGINE = Memory" - ) - instance.query( - "insert into ontime values (2016, 'test6'), (2017, 'test7'), (2018, 'test8')" - ) - - def check(self): - assert TSV( - self.cluster.instances["s1_1_0"].query("SELECT Year FROM ontime22") - ) == TSV("2017\n") - instance = cluster.instances["s0_0_0"] - instance.query("DROP TABLE ontime") - instance = cluster.instances["s1_1_0"] - instance.query("DROP TABLE ontime22") - - -class Task_no_arg: - def __init__(self, cluster): - self.cluster = cluster - self.zk_task_path = "/clickhouse-copier/task_no_arg" - self.rows = 1000000 - self.container_task_file = "/task_no_arg.xml" - - for instance_name, _ in cluster.instances.items(): - instance = cluster.instances[instance_name] - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "./task_no_arg.xml"), - self.container_task_file, - ) - print( - "Copied task file to container of '{}' instance. 
Path {}".format( - instance_name, self.container_task_file - ) - ) - - def start(self): - instance = cluster.instances["s0_0_0"] - instance.query("DROP TABLE IF EXISTS copier_test1 SYNC") - instance.query( - "create table if not exists copier_test1 (date Date, id UInt32) engine = MergeTree PARTITION BY date ORDER BY date SETTINGS index_granularity = 8192" - ) - instance.query("insert into copier_test1 values ('2016-01-01', 10);") - - def check(self): - assert TSV( - self.cluster.instances["s1_1_0"].query("SELECT date FROM copier_test1_1") - ) == TSV("2016-01-01\n") - instance = cluster.instances["s0_0_0"] - instance.query("DROP TABLE copier_test1 SYNC") - instance = cluster.instances["s1_1_0"] - instance.query("DROP TABLE copier_test1_1 SYNC") - - -class Task_non_partitioned_table: - def __init__(self, cluster): - self.cluster = cluster - self.zk_task_path = "/clickhouse-copier/task_non_partitoned_table" - self.rows = 1000000 - self.container_task_file = "/task_non_partitioned_table.xml" - - for instance_name, _ in cluster.instances.items(): - instance = cluster.instances[instance_name] - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "./task_non_partitioned_table.xml"), - self.container_task_file, - ) - print( - "Copied task file to container of '{}' instance. Path {}".format( - instance_name, self.container_task_file - ) - ) - - def start(self): - instance = cluster.instances["s0_0_0"] - instance.query("DROP TABLE IF EXISTS copier_test1 SYNC") - instance.query( - "create table copier_test1 (date Date, id UInt32) engine = MergeTree ORDER BY date SETTINGS index_granularity = 8192" - ) - instance.query("insert into copier_test1 values ('2016-01-01', 10);") - - def check(self): - assert TSV( - self.cluster.instances["s1_1_0"].query("SELECT date FROM copier_test1_1") - ) == TSV("2016-01-01\n") - instance = cluster.instances["s0_0_0"] - instance.query("DROP TABLE copier_test1") - instance = cluster.instances["s1_1_0"] - instance.query("DROP TABLE copier_test1_1") - - -class Task_self_copy: - def __init__(self, cluster): - self.cluster = cluster - self.zk_task_path = "/clickhouse-copier/task_self_copy" - self.container_task_file = "/task_self_copy.xml" - - for instance_name, _ in cluster.instances.items(): - instance = cluster.instances[instance_name] - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "./task_self_copy.xml"), - self.container_task_file, - ) - print( - "Copied task file to container of '{}' instance. 
Path {}".format( - instance_name, self.container_task_file - ) - ) - - def start(self): - instance = cluster.instances["s0_0_0"] - instance.query("DROP DATABASE IF EXISTS db1 SYNC") - instance.query("DROP DATABASE IF EXISTS db2 SYNC") - instance.query("CREATE DATABASE IF NOT EXISTS db1;") - instance.query( - "CREATE TABLE IF NOT EXISTS db1.source_table (`a` Int8, `b` String, `c` Int8) ENGINE = MergeTree PARTITION BY a ORDER BY a SETTINGS index_granularity = 8192" - ) - instance.query("CREATE DATABASE IF NOT EXISTS db2;") - instance.query( - "CREATE TABLE IF NOT EXISTS db2.destination_table (`a` Int8, `b` String, `c` Int8) ENGINE = MergeTree PARTITION BY a ORDER BY a SETTINGS index_granularity = 8192" - ) - instance.query("INSERT INTO db1.source_table VALUES (1, 'ClickHouse', 1);") - instance.query("INSERT INTO db1.source_table VALUES (2, 'Copier', 2);") - - def check(self): - instance = cluster.instances["s0_0_0"] - assert TSV( - instance.query("SELECT * FROM db2.destination_table ORDER BY a") - ) == TSV(instance.query("SELECT * FROM db1.source_table ORDER BY a")) - instance = cluster.instances["s0_0_0"] - instance.query("DROP DATABASE IF EXISTS db1 SYNC") - instance.query("DROP DATABASE IF EXISTS db2 SYNC") - - -def execute_task(started_cluster, task, cmd_options): - task.start() - - zk = started_cluster.get_kazoo_client("zoo1") - print("Use ZooKeeper server: {}:{}".format(zk.hosts[0][0], zk.hosts[0][1])) - - try: - zk.delete("/clickhouse-copier", recursive=True) - except kazoo.exceptions.NoNodeError: - print("No node /clickhouse-copier. It is Ok in first test.") - - # Run cluster-copier processes on each node - docker_api = started_cluster.docker_client.api - copiers_exec_ids = [] - - cmd = [ - "/usr/bin/clickhouse", - "copier", - "--config", - "/etc/clickhouse-server/config-copier.xml", - "--task-path", - task.zk_task_path, - "--task-file", - task.container_task_file, - "--task-upload-force", - "true", - "--base-dir", - "/var/log/clickhouse-server/copier", - ] - cmd += cmd_options - - print(cmd) - - copiers = random.sample(list(started_cluster.instances.keys()), 3) - - for instance_name in copiers: - instance = started_cluster.instances[instance_name] - container = instance.get_docker_handle() - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "configs/config-copier.xml"), - "/etc/clickhouse-server/config-copier.xml", - ) - print("Copied copier config to {}".format(instance.name)) - exec_id = docker_api.exec_create(container.id, cmd, stderr=True) - output = docker_api.exec_start(exec_id).decode("utf8") - print(output) - copiers_exec_ids.append(exec_id) - print( - "Copier for {} ({}) has started".format(instance.name, instance.ip_address) - ) - - # Wait for copiers stopping and check their return codes - for exec_id, instance_name in zip(copiers_exec_ids, copiers): - instance = started_cluster.instances[instance_name] - while True: - res = docker_api.exec_inspect(exec_id) - if not res["Running"]: - break - time.sleep(0.5) - - assert res["ExitCode"] == 0, "Instance: {} ({}). 
Info: {}".format( - instance.name, instance.ip_address, repr(res) - ) - - try: - task.check() - finally: - zk.delete(task.zk_task_path, recursive=True) - - -# Tests - - -@pytest.mark.parametrize(("use_sample_offset"), [False, True]) -def test_copy_simple(started_cluster, use_sample_offset): - if use_sample_offset: - execute_task( - started_cluster, - Task1(started_cluster), - ["--experimental-use-sample-offset", "1"], - ) - else: - execute_task(started_cluster, Task1(started_cluster), []) - - -@pytest.mark.parametrize(("use_sample_offset"), [False, True]) -def test_copy_with_recovering(started_cluster, use_sample_offset): - if use_sample_offset: - execute_task( - started_cluster, - Task1(started_cluster), - [ - "--copy-fault-probability", - str(COPYING_FAIL_PROBABILITY), - "--experimental-use-sample-offset", - "1", - "--max-table-tries", - "10", - ], - ) - else: - execute_task( - started_cluster, - Task1(started_cluster), - [ - "--copy-fault-probability", - str(COPYING_FAIL_PROBABILITY), - "--max-table-tries", - "10", - ], - ) - - -@pytest.mark.parametrize(("use_sample_offset"), [False, True]) -def test_copy_with_recovering_after_move_faults(started_cluster, use_sample_offset): - if use_sample_offset: - execute_task( - started_cluster, - Task1(started_cluster), - [ - "--move-fault-probability", - str(MOVING_FAIL_PROBABILITY), - "--experimental-use-sample-offset", - "1", - ], - ) - else: - execute_task( - started_cluster, - Task1(started_cluster), - ["--move-fault-probability", str(MOVING_FAIL_PROBABILITY)], - ) - - -@pytest.mark.timeout(600) -def test_copy_month_to_week_partition(started_cluster): - execute_task(started_cluster, Task2(started_cluster, "test1"), []) - - -@pytest.mark.timeout(600) -def test_copy_month_to_week_partition_with_recovering(started_cluster): - execute_task( - started_cluster, - Task2(started_cluster, "test2"), - [ - "--copy-fault-probability", - str(COPYING_FAIL_PROBABILITY), - "--max-table-tries", - "10", - ], - ) - - -@pytest.mark.timeout(600) -def test_copy_month_to_week_partition_with_recovering_after_move_faults( - started_cluster, -): - execute_task( - started_cluster, - Task2(started_cluster, "test3"), - ["--move-fault-probability", str(MOVING_FAIL_PROBABILITY)], - ) - - -def test_block_size(started_cluster): - execute_task(started_cluster, Task_test_block_size(started_cluster), []) - - -def test_no_index(started_cluster): - execute_task(started_cluster, Task_no_index(started_cluster), []) - - -def test_no_arg(started_cluster): - execute_task(started_cluster, Task_no_arg(started_cluster), []) - - -def test_non_partitioned_table(started_cluster): - execute_task(started_cluster, Task_non_partitioned_table(started_cluster), []) - - -def test_self_copy(started_cluster): - execute_task(started_cluster, Task_self_copy(started_cluster), []) diff --git a/tests/integration/test_cluster_copier/test_three_nodes.py b/tests/integration/test_cluster_copier/test_three_nodes.py deleted file mode 100644 index e7d07757adb..00000000000 --- a/tests/integration/test_cluster_copier/test_three_nodes.py +++ /dev/null @@ -1,286 +0,0 @@ -import os -import sys -import time -import logging -import pytest - -from helpers.cluster import ClickHouseCluster -from helpers.test_tools import TSV - -import docker - -CURRENT_TEST_DIR = os.path.dirname(os.path.abspath(__file__)) -sys.path.insert(0, os.path.dirname(CURRENT_TEST_DIR)) - -cluster = ClickHouseCluster(__file__) - - -@pytest.fixture(scope="module") -def started_cluster(): - global cluster - try: - for name in ["first", "second", 
"third"]: - cluster.add_instance( - name, - main_configs=[ - "configs_three_nodes/conf.d/clusters.xml", - "configs_three_nodes/conf.d/ddl.xml", - ], - user_configs=["configs_three_nodes/users.xml"], - with_zookeeper=True, - ) - - cluster.start() - yield cluster - - finally: - cluster.shutdown() - - -class Task: - def __init__(self, cluster): - self.cluster = cluster - self.zk_task_path = "/clickhouse-copier/task" - self.container_task_file = "/task_taxi_data.xml" - - for instance_name, _ in cluster.instances.items(): - instance = cluster.instances[instance_name] - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "./task_taxi_data.xml"), - self.container_task_file, - ) - logging.debug( - f"Copied task file to container of '{instance_name}' instance. Path {self.container_task_file}" - ) - - def start(self): - for name in ["first", "second", "third"]: - node = cluster.instances[name] - node.query("DROP DATABASE IF EXISTS dailyhistory SYNC;") - node.query("DROP DATABASE IF EXISTS monthlyhistory SYNC;") - - first = cluster.instances["first"] - - # daily partition database - first.query("CREATE DATABASE IF NOT EXISTS dailyhistory on cluster events;") - first.query( - """CREATE TABLE dailyhistory.yellow_tripdata_staging ON CLUSTER events - ( - id UUID DEFAULT generateUUIDv4(), - vendor_id String, - tpep_pickup_datetime DateTime('UTC'), - tpep_dropoff_datetime DateTime('UTC'), - passenger_count Nullable(Float64), - trip_distance String, - pickup_longitude Float64, - pickup_latitude Float64, - rate_code_id String, - store_and_fwd_flag String, - dropoff_longitude Float64, - dropoff_latitude Float64, - payment_type String, - fare_amount String, - extra String, - mta_tax String, - tip_amount String, - tolls_amount String, - improvement_surcharge String, - total_amount String, - pickup_location_id String, - dropoff_location_id String, - congestion_surcharge String, - junk1 String, junk2 String - ) - Engine = ReplacingMergeTree() - PRIMARY KEY (tpep_pickup_datetime, id) - ORDER BY (tpep_pickup_datetime, id) - PARTITION BY (toYYYYMMDD(tpep_pickup_datetime))""" - ) - - first.query( - """CREATE TABLE dailyhistory.yellow_tripdata - ON CLUSTER events - AS dailyhistory.yellow_tripdata_staging - ENGINE = Distributed('events', 'dailyhistory', yellow_tripdata_staging, sipHash64(id) % 3);""" - ) - - first.query( - """INSERT INTO dailyhistory.yellow_tripdata - SELECT * FROM generateRandom( - 'id UUID DEFAULT generateUUIDv4(), - vendor_id String, - tpep_pickup_datetime DateTime(\\'UTC\\'), - tpep_dropoff_datetime DateTime(\\'UTC\\'), - passenger_count Nullable(Float64), - trip_distance String, - pickup_longitude Float64, - pickup_latitude Float64, - rate_code_id String, - store_and_fwd_flag String, - dropoff_longitude Float64, - dropoff_latitude Float64, - payment_type String, - fare_amount String, - extra String, - mta_tax String, - tip_amount String, - tolls_amount String, - improvement_surcharge String, - total_amount String, - pickup_location_id String, - dropoff_location_id String, - congestion_surcharge String, - junk1 String, - junk2 String', - 1, 10, 2) LIMIT 50;""" - ) - - # monthly partition database - first.query("create database IF NOT EXISTS monthlyhistory on cluster events;") - first.query( - """CREATE TABLE monthlyhistory.yellow_tripdata_staging ON CLUSTER events - ( - id UUID DEFAULT generateUUIDv4(), - vendor_id String, - tpep_pickup_datetime DateTime('UTC'), - tpep_dropoff_datetime DateTime('UTC'), - passenger_count Nullable(Float64), - trip_distance String, - pickup_longitude 
Float64, - pickup_latitude Float64, - rate_code_id String, - store_and_fwd_flag String, - dropoff_longitude Float64, - dropoff_latitude Float64, - payment_type String, - fare_amount String, - extra String, - mta_tax String, - tip_amount String, - tolls_amount String, - improvement_surcharge String, - total_amount String, - pickup_location_id String, - dropoff_location_id String, - congestion_surcharge String, - junk1 String, - junk2 String - ) - Engine = ReplacingMergeTree() - PRIMARY KEY (tpep_pickup_datetime, id) - ORDER BY (tpep_pickup_datetime, id) - PARTITION BY (pickup_location_id, toYYYYMM(tpep_pickup_datetime))""" - ) - - first.query( - """CREATE TABLE monthlyhistory.yellow_tripdata - ON CLUSTER events - AS monthlyhistory.yellow_tripdata_staging - ENGINE = Distributed('events', 'monthlyhistory', yellow_tripdata_staging, sipHash64(id) % 3);""" - ) - - def check(self): - first = cluster.instances["first"] - a = TSV(first.query("SELECT count() from dailyhistory.yellow_tripdata")) - b = TSV(first.query("SELECT count() from monthlyhistory.yellow_tripdata")) - assert a == b, "Distributed tables" - - for instance_name, instance in cluster.instances.items(): - instance = cluster.instances[instance_name] - a = instance.query( - "SELECT count() from dailyhistory.yellow_tripdata_staging" - ) - b = instance.query( - "SELECT count() from monthlyhistory.yellow_tripdata_staging" - ) - assert a == b, "MergeTree tables on each shard" - - a = TSV( - instance.query( - "SELECT sipHash64(*) from dailyhistory.yellow_tripdata_staging ORDER BY id" - ) - ) - b = TSV( - instance.query( - "SELECT sipHash64(*) from monthlyhistory.yellow_tripdata_staging ORDER BY id" - ) - ) - - assert a == b, "Data on each shard" - - for name in ["first", "second", "third"]: - node = cluster.instances[name] - node.query("DROP DATABASE IF EXISTS dailyhistory SYNC;") - node.query("DROP DATABASE IF EXISTS monthlyhistory SYNC;") - - -def execute_task(started_cluster, task, cmd_options): - task.start() - - zk = started_cluster.get_kazoo_client("zoo1") - logging.debug("Use ZooKeeper server: {}:{}".format(zk.hosts[0][0], zk.hosts[0][1])) - - # Run cluster-copier processes on each node - docker_api = started_cluster.docker_client.api - copiers_exec_ids = [] - - cmd = [ - "/usr/bin/clickhouse", - "copier", - "--config", - "/etc/clickhouse-server/config-copier.xml", - "--task-path", - task.zk_task_path, - "--task-file", - task.container_task_file, - "--task-upload-force", - "true", - "--base-dir", - "/var/log/clickhouse-server/copier", - ] - cmd += cmd_options - - logging.debug(f"execute_task cmd: {cmd}") - - for instance_name in started_cluster.instances.keys(): - instance = started_cluster.instances[instance_name] - container = instance.get_docker_handle() - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "configs_three_nodes/config-copier.xml"), - "/etc/clickhouse-server/config-copier.xml", - ) - logging.info("Copied copier config to {}".format(instance.name)) - exec_id = docker_api.exec_create(container.id, cmd, stderr=True) - output = docker_api.exec_start(exec_id).decode("utf8") - logging.info(output) - copiers_exec_ids.append(exec_id) - logging.info( - "Copier for {} ({}) has started".format(instance.name, instance.ip_address) - ) - - # time.sleep(1000) - - # Wait for copiers stopping and check their return codes - for exec_id, instance in zip( - copiers_exec_ids, iter(started_cluster.instances.values()) - ): - while True: - res = docker_api.exec_inspect(exec_id) - if not res["Running"]: - break - time.sleep(1) 
- - assert res["ExitCode"] == 0, "Instance: {} ({}). Info: {}".format( - instance.name, instance.ip_address, repr(res) - ) - - try: - task.check() - finally: - zk.delete(task.zk_task_path, recursive=True) - - -# Tests -@pytest.mark.timeout(600) -def test(started_cluster): - execute_task(started_cluster, Task(started_cluster), []) diff --git a/tests/integration/test_cluster_copier/test_trivial.py b/tests/integration/test_cluster_copier/test_trivial.py deleted file mode 100644 index b8060583ef8..00000000000 --- a/tests/integration/test_cluster_copier/test_trivial.py +++ /dev/null @@ -1,227 +0,0 @@ -import os -import sys -import time -import random -import string - -from helpers.cluster import ClickHouseCluster -from helpers.test_tools import TSV - -import kazoo -import pytest -import docker - - -CURRENT_TEST_DIR = os.path.dirname(os.path.abspath(__file__)) -sys.path.insert(0, os.path.dirname(CURRENT_TEST_DIR)) - - -COPYING_FAIL_PROBABILITY = 0.1 -MOVING_FAIL_PROBABILITY = 0.1 - -cluster = ClickHouseCluster(__file__) - - -def generateRandomString(count): - return "".join( - random.choice(string.ascii_uppercase + string.digits) for _ in range(count) - ) - - -@pytest.fixture(scope="module") -def started_cluster(): - global cluster - try: - for name in ["first_trivial", "second_trivial"]: - instance = cluster.add_instance( - name, - main_configs=["configs/conf.d/clusters_trivial.xml"], - user_configs=["configs_two_nodes/users.xml"], - macros={ - "cluster": name, - "shard": "the_only_shard", - "replica": "the_only_replica", - }, - with_zookeeper=True, - ) - - cluster.start() - yield cluster - - finally: - cluster.shutdown() - - -class TaskTrivial: - def __init__(self, cluster): - self.cluster = cluster - self.zk_task_path = "/clickhouse-copier/task_trivial" - self.copier_task_config = open( - os.path.join(CURRENT_TEST_DIR, "task_trivial.xml"), "r" - ).read() - - def start(self): - source = cluster.instances["first_trivial"] - destination = cluster.instances["second_trivial"] - - for node in [source, destination]: - node.query("DROP DATABASE IF EXISTS default") - node.query("CREATE DATABASE IF NOT EXISTS default") - - source.query( - "CREATE TABLE trivial (d UInt64, d1 UInt64 MATERIALIZED d+1)" - "ENGINE=ReplicatedMergeTree('/clickhouse/tables/source_trivial_cluster/1/trivial/{}', '1') " - "PARTITION BY d % 5 ORDER BY (d, sipHash64(d)) SAMPLE BY sipHash64(d) SETTINGS index_granularity = 16".format( - generateRandomString(10) - ) - ) - - source.query( - "INSERT INTO trivial SELECT * FROM system.numbers LIMIT 1002", - settings={"distributed_foreground_insert": 1}, - ) - - def check(self): - zk = cluster.get_kazoo_client("zoo1") - status_data, _ = zk.get(self.zk_task_path + "/status") - assert ( - status_data - == b'{"hits":{"all_partitions_count":5,"processed_partitions_count":5}}' - ) - - source = cluster.instances["first_trivial"] - destination = cluster.instances["second_trivial"] - - assert TSV(source.query("SELECT count() FROM trivial")) == TSV("1002\n") - assert TSV(destination.query("SELECT count() FROM trivial")) == TSV("1002\n") - - for node in [source, destination]: - node.query("DROP TABLE trivial") - - -class TaskReplicatedWithoutArguments: - def __init__(self, cluster): - self.cluster = cluster - self.zk_task_path = "/clickhouse-copier/task_trivial_without_arguments" - self.copier_task_config = open( - os.path.join(CURRENT_TEST_DIR, "task_trivial_without_arguments.xml"), "r" - ).read() - - def start(self): - source = cluster.instances["first_trivial"] - destination = 
cluster.instances["second_trivial"] - - for node in [source, destination]: - node.query("DROP DATABASE IF EXISTS default") - node.query("CREATE DATABASE IF NOT EXISTS default") - - source.query( - "CREATE TABLE trivial_without_arguments ON CLUSTER source_trivial_cluster (d UInt64, d1 UInt64 MATERIALIZED d+1) " - "ENGINE=ReplicatedMergeTree() " - "PARTITION BY d % 5 ORDER BY (d, sipHash64(d)) SAMPLE BY sipHash64(d) SETTINGS index_granularity = 16" - ) - - source.query( - "INSERT INTO trivial_without_arguments SELECT * FROM system.numbers LIMIT 1002", - settings={"distributed_foreground_insert": 1}, - ) - - def check(self): - zk = cluster.get_kazoo_client("zoo1") - status_data, _ = zk.get(self.zk_task_path + "/status") - assert ( - status_data - == b'{"hits":{"all_partitions_count":5,"processed_partitions_count":5}}' - ) - - source = cluster.instances["first_trivial"] - destination = cluster.instances["second_trivial"] - - assert TSV( - source.query("SELECT count() FROM trivial_without_arguments") - ) == TSV("1002\n") - assert TSV( - destination.query("SELECT count() FROM trivial_without_arguments") - ) == TSV("1002\n") - - for node in [source, destination]: - node.query("DROP TABLE trivial_without_arguments") - - -def execute_task(started_cluster, task, cmd_options): - task.start() - - zk = started_cluster.get_kazoo_client("zoo1") - print("Use ZooKeeper server: {}:{}".format(zk.hosts[0][0], zk.hosts[0][1])) - - try: - zk.delete("/clickhouse-copier", recursive=True) - except kazoo.exceptions.NoNodeError: - print("No node /clickhouse-copier. It is Ok in first test.") - - zk_task_path = task.zk_task_path - zk.ensure_path(zk_task_path) - zk.create(zk_task_path + "/description", task.copier_task_config.encode()) - - # Run cluster-copier processes on each node - docker_api = started_cluster.docker_client.api - copiers_exec_ids = [] - - cmd = [ - "/usr/bin/clickhouse", - "copier", - "--config", - "/etc/clickhouse-server/config-copier.xml", - "--task-path", - zk_task_path, - "--base-dir", - "/var/log/clickhouse-server/copier", - ] - cmd += cmd_options - - copiers = list(started_cluster.instances.keys()) - - for instance_name in copiers: - instance = started_cluster.instances[instance_name] - container = instance.get_docker_handle() - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "configs/config-copier.xml"), - "/etc/clickhouse-server/config-copier.xml", - ) - print("Copied copier config to {}".format(instance.name)) - exec_id = docker_api.exec_create(container.id, cmd, stderr=True) - output = docker_api.exec_start(exec_id).decode("utf8") - print(output) - copiers_exec_ids.append(exec_id) - print( - "Copier for {} ({}) has started".format(instance.name, instance.ip_address) - ) - - # Wait for copiers stopping and check their return codes - for exec_id, instance_name in zip(copiers_exec_ids, copiers): - instance = started_cluster.instances[instance_name] - while True: - res = docker_api.exec_inspect(exec_id) - if not res["Running"]: - break - time.sleep(0.5) - - assert res["ExitCode"] == 0, "Instance: {} ({}). 
Info: {}".format( - instance.name, instance.ip_address, repr(res) - ) - - try: - task.check() - finally: - zk.delete(zk_task_path, recursive=True) - - -# Tests - - -def test_trivial_copy(started_cluster): - execute_task(started_cluster, TaskTrivial(started_cluster), []) - - -def test_trivial_without_arguments(started_cluster): - execute_task(started_cluster, TaskReplicatedWithoutArguments(started_cluster), []) diff --git a/tests/integration/test_cluster_copier/test_two_nodes.py b/tests/integration/test_cluster_copier/test_two_nodes.py deleted file mode 100644 index 1bd3561f24f..00000000000 --- a/tests/integration/test_cluster_copier/test_two_nodes.py +++ /dev/null @@ -1,597 +0,0 @@ -import os -import sys -import time -import logging -import pytest - -from helpers.cluster import ClickHouseCluster -from helpers.test_tools import TSV - -import docker - -CURRENT_TEST_DIR = os.path.dirname(os.path.abspath(__file__)) -sys.path.insert(0, os.path.dirname(CURRENT_TEST_DIR)) - -cluster = ClickHouseCluster(__file__) - - -@pytest.fixture(scope="module") -def started_cluster(): - global cluster - try: - for name in ["first_of_two", "second_of_two"]: - instance = cluster.add_instance( - name, - main_configs=[ - "configs_two_nodes/conf.d/clusters.xml", - "configs_two_nodes/conf.d/ddl.xml", - "configs_two_nodes/conf.d/storage_configuration.xml", - ], - user_configs=["configs_two_nodes/users.xml"], - with_zookeeper=True, - ) - - cluster.start() - - for name in ["first_of_two", "second_of_two"]: - instance = cluster.instances[name] - instance.exec_in_container(["bash", "-c", "mkdir /jbod1"]) - instance.exec_in_container(["bash", "-c", "mkdir /jbod2"]) - instance.exec_in_container(["bash", "-c", "mkdir /external"]) - - yield cluster - - finally: - cluster.shutdown() - - -# Will copy table from `first` node to `second` -class TaskWithDifferentSchema: - def __init__(self, cluster): - self.cluster = cluster - self.zk_task_path = "/clickhouse-copier/task_with_different_schema" - self.container_task_file = "/task_with_different_schema.xml" - - for instance_name, _ in cluster.instances.items(): - instance = cluster.instances[instance_name] - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "./task_with_different_schema.xml"), - self.container_task_file, - ) - print( - "Copied task file to container of '{}' instance. 
Path {}".format( - instance_name, self.container_task_file - ) - ) - - def start(self): - first = cluster.instances["first_of_two"] - second = cluster.instances["second_of_two"] - - first.query("DROP DATABASE IF EXISTS db_different_schema SYNC") - second.query("DROP DATABASE IF EXISTS db_different_schema SYNC") - - first.query("CREATE DATABASE IF NOT EXISTS db_different_schema;") - first.query( - """CREATE TABLE db_different_schema.source - ( - Column1 String, - Column2 UInt32, - Column3 Date, - Column4 DateTime, - Column5 UInt16, - Column6 String, - Column7 String, - Column8 String, - Column9 String, - Column10 String, - Column11 String, - Column12 Decimal(3, 1), - Column13 DateTime, - Column14 UInt16 - ) - ENGINE = MergeTree() - PARTITION BY (toYYYYMMDD(Column3), Column3) - PRIMARY KEY (Column1, Column2, Column3, Column4, Column6, Column7, Column8, Column9) - ORDER BY (Column1, Column2, Column3, Column4, Column6, Column7, Column8, Column9) - SETTINGS index_granularity = 8192""" - ) - - first.query( - """INSERT INTO db_different_schema.source SELECT * FROM generateRandom( - 'Column1 String, Column2 UInt32, Column3 Date, Column4 DateTime, Column5 UInt16, - Column6 String, Column7 String, Column8 String, Column9 String, Column10 String, - Column11 String, Column12 Decimal(3, 1), Column13 DateTime, Column14 UInt16', 1, 10, 2) LIMIT 50;""" - ) - - second.query("CREATE DATABASE IF NOT EXISTS db_different_schema;") - second.query( - """CREATE TABLE db_different_schema.destination - ( - Column1 LowCardinality(String) CODEC(LZ4), - Column2 UInt32 CODEC(LZ4), - Column3 Date CODEC(DoubleDelta, LZ4), - Column4 DateTime CODEC(DoubleDelta, LZ4), - Column5 UInt16 CODEC(LZ4), - Column6 LowCardinality(String) CODEC(ZSTD), - Column7 LowCardinality(String) CODEC(ZSTD), - Column8 LowCardinality(String) CODEC(ZSTD), - Column9 LowCardinality(String) CODEC(ZSTD), - Column10 String CODEC(ZSTD(6)), - Column11 LowCardinality(String) CODEC(LZ4), - Column12 Decimal(3,1) CODEC(LZ4), - Column13 DateTime CODEC(DoubleDelta, LZ4), - Column14 UInt16 CODEC(LZ4) - ) ENGINE = MergeTree() - PARTITION BY toYYYYMMDD(Column3) - ORDER BY (Column9, Column1, Column2, Column3, Column4);""" - ) - - print("Preparation completed") - - def check(self): - first = cluster.instances["first_of_two"] - second = cluster.instances["second_of_two"] - - a = first.query("SELECT count() from db_different_schema.source") - b = second.query("SELECT count() from db_different_schema.destination") - assert a == b, "Count" - - a = TSV( - first.query( - """SELECT sipHash64(*) from db_different_schema.source - ORDER BY (Column1, Column2, Column3, Column4, Column5, Column6, Column7, Column8, Column9, Column10, Column11, Column12, Column13, Column14)""" - ) - ) - b = TSV( - second.query( - """SELECT sipHash64(*) from db_different_schema.destination - ORDER BY (Column1, Column2, Column3, Column4, Column5, Column6, Column7, Column8, Column9, Column10, Column11, Column12, Column13, Column14)""" - ) - ) - assert a == b, "Data" - - first.query("DROP DATABASE IF EXISTS db_different_schema SYNC") - second.query("DROP DATABASE IF EXISTS db_different_schema SYNC") - - -# Just simple copying, but table schema has TTL on columns -# Also table will have slightly different schema -class TaskTTL: - def __init__(self, cluster): - self.cluster = cluster - self.zk_task_path = "/clickhouse-copier/task_ttl_columns" - self.container_task_file = "/task_ttl_columns.xml" - - for instance_name, _ in cluster.instances.items(): - instance = cluster.instances[instance_name] - 
instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "./task_ttl_columns.xml"), - self.container_task_file, - ) - print( - "Copied task file to container of '{}' instance. Path {}".format( - instance_name, self.container_task_file - ) - ) - - def start(self): - first = cluster.instances["first_of_two"] - second = cluster.instances["second_of_two"] - - first.query("DROP DATABASE IF EXISTS db_ttl_columns SYNC") - second.query("DROP DATABASE IF EXISTS db_ttl_columns SYNC") - - first.query("CREATE DATABASE IF NOT EXISTS db_ttl_columns;") - first.query( - """CREATE TABLE db_ttl_columns.source - ( - Column1 String, - Column2 UInt32, - Column3 Date, - Column4 DateTime, - Column5 UInt16, - Column6 String TTL now() + INTERVAL 1 MONTH, - Column7 Decimal(3, 1) TTL now() + INTERVAL 1 MONTH, - Column8 Tuple(Float64, Float64) TTL now() + INTERVAL 1 MONTH - ) - ENGINE = MergeTree() - PARTITION BY (toYYYYMMDD(Column3), Column3) - PRIMARY KEY (Column1, Column2, Column3) - ORDER BY (Column1, Column2, Column3) - SETTINGS index_granularity = 8192""" - ) - - first.query( - """INSERT INTO db_ttl_columns.source SELECT * FROM generateRandom( - 'Column1 String, Column2 UInt32, Column3 Date, Column4 DateTime, Column5 UInt16, - Column6 String, Column7 Decimal(3, 1), Column8 Tuple(Float64, Float64)', 1, 10, 2) LIMIT 50;""" - ) - - second.query("CREATE DATABASE IF NOT EXISTS db_ttl_columns;") - second.query( - """CREATE TABLE db_ttl_columns.destination - ( - Column1 String, - Column2 UInt32, - Column3 Date, - Column4 DateTime TTL now() + INTERVAL 1 MONTH, - Column5 UInt16 TTL now() + INTERVAL 1 MONTH, - Column6 String TTL now() + INTERVAL 1 MONTH, - Column7 Decimal(3, 1) TTL now() + INTERVAL 1 MONTH, - Column8 Tuple(Float64, Float64) - ) ENGINE = MergeTree() - PARTITION BY toYYYYMMDD(Column3) - ORDER BY (Column3, Column2, Column1);""" - ) - - print("Preparation completed") - - def check(self): - first = cluster.instances["first_of_two"] - second = cluster.instances["second_of_two"] - - a = first.query("SELECT count() from db_ttl_columns.source") - b = second.query("SELECT count() from db_ttl_columns.destination") - assert a == b, "Count" - - a = TSV( - first.query( - """SELECT sipHash64(*) from db_ttl_columns.source - ORDER BY (Column1, Column2, Column3, Column4, Column5, Column6, Column7, Column8)""" - ) - ) - b = TSV( - second.query( - """SELECT sipHash64(*) from db_ttl_columns.destination - ORDER BY (Column1, Column2, Column3, Column4, Column5, Column6, Column7, Column8)""" - ) - ) - assert a == b, "Data" - - first.query("DROP DATABASE IF EXISTS db_ttl_columns SYNC") - second.query("DROP DATABASE IF EXISTS db_ttl_columns SYNC") - - -class TaskSkipIndex: - def __init__(self, cluster): - self.cluster = cluster - self.zk_task_path = "/clickhouse-copier/task_skip_index" - self.container_task_file = "/task_skip_index.xml" - - for instance_name, _ in cluster.instances.items(): - instance = cluster.instances[instance_name] - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "./task_skip_index.xml"), - self.container_task_file, - ) - print( - "Copied task file to container of '{}' instance. 
Path {}".format( - instance_name, self.container_task_file - ) - ) - - def start(self): - first = cluster.instances["first_of_two"] - second = cluster.instances["second_of_two"] - - first.query("DROP DATABASE IF EXISTS db_skip_index SYNC") - second.query("DROP DATABASE IF EXISTS db_skip_index SYNC") - - first.query("CREATE DATABASE IF NOT EXISTS db_skip_index;") - first.query( - """CREATE TABLE db_skip_index.source - ( - Column1 UInt64, - Column2 Int32, - Column3 Date, - Column4 DateTime, - Column5 String, - INDEX a (Column1 * Column2, Column5) TYPE minmax GRANULARITY 3, - INDEX b (Column1 * length(Column5)) TYPE set(1000) GRANULARITY 4 - ) - ENGINE = MergeTree() - PARTITION BY (toYYYYMMDD(Column3), Column3) - PRIMARY KEY (Column1, Column2, Column3) - ORDER BY (Column1, Column2, Column3) - SETTINGS index_granularity = 8192""" - ) - - first.query( - """INSERT INTO db_skip_index.source SELECT * FROM generateRandom( - 'Column1 UInt64, Column2 Int32, Column3 Date, Column4 DateTime, Column5 String', 1, 10, 2) LIMIT 100;""" - ) - - second.query("CREATE DATABASE IF NOT EXISTS db_skip_index;") - second.query( - """CREATE TABLE db_skip_index.destination - ( - Column1 UInt64, - Column2 Int32, - Column3 Date, - Column4 DateTime, - Column5 String, - INDEX a (Column1 * Column2, Column5) TYPE minmax GRANULARITY 3, - INDEX b (Column1 * length(Column5)) TYPE set(1000) GRANULARITY 4 - ) ENGINE = MergeTree() - PARTITION BY toYYYYMMDD(Column3) - ORDER BY (Column3, Column2, Column1);""" - ) - - print("Preparation completed") - - def check(self): - first = cluster.instances["first_of_two"] - second = cluster.instances["second_of_two"] - - a = first.query("SELECT count() from db_skip_index.source") - b = second.query("SELECT count() from db_skip_index.destination") - assert a == b, "Count" - - a = TSV( - first.query( - """SELECT sipHash64(*) from db_skip_index.source - ORDER BY (Column1, Column2, Column3, Column4, Column5)""" - ) - ) - b = TSV( - second.query( - """SELECT sipHash64(*) from db_skip_index.destination - ORDER BY (Column1, Column2, Column3, Column4, Column5)""" - ) - ) - assert a == b, "Data" - - first.query("DROP DATABASE IF EXISTS db_skip_index SYNC") - second.query("DROP DATABASE IF EXISTS db_skip_index SYNC") - - -class TaskTTLMoveToVolume: - def __init__(self, cluster): - self.cluster = cluster - self.zk_task_path = "/clickhouse-copier/task_ttl_move_to_volume" - self.container_task_file = "/task_ttl_move_to_volume.xml" - - for instance_name, _ in cluster.instances.items(): - instance = cluster.instances[instance_name] - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "./task_ttl_move_to_volume.xml"), - self.container_task_file, - ) - print( - "Copied task file to container of '{}' instance. 
Path {}".format( - instance_name, self.container_task_file - ) - ) - - def start(self): - first = cluster.instances["first_of_two"] - second = cluster.instances["first_of_two"] - - first.query("DROP DATABASE IF EXISTS db_move_to_volume SYNC") - second.query("DROP DATABASE IF EXISTS db_move_to_volume SYNC") - - first.query("CREATE DATABASE IF NOT EXISTS db_move_to_volume;") - first.query( - """CREATE TABLE db_move_to_volume.source - ( - Column1 UInt64, - Column2 Int32, - Column3 Date, - Column4 DateTime, - Column5 String - ) - ENGINE = MergeTree() - PARTITION BY (toYYYYMMDD(Column3), Column3) - PRIMARY KEY (Column1, Column2, Column3) - ORDER BY (Column1, Column2, Column3) - TTL Column3 + INTERVAL 1 MONTH TO VOLUME 'external' - SETTINGS storage_policy = 'external_with_jbods';""" - ) - - first.query( - """INSERT INTO db_move_to_volume.source SELECT * FROM generateRandom( - 'Column1 UInt64, Column2 Int32, Column3 Date, Column4 DateTime, Column5 String', 1, 10, 2) LIMIT 100;""" - ) - - second.query("CREATE DATABASE IF NOT EXISTS db_move_to_volume;") - second.query( - """CREATE TABLE db_move_to_volume.destination - ( - Column1 UInt64, - Column2 Int32, - Column3 Date, - Column4 DateTime, - Column5 String - ) ENGINE = MergeTree() - PARTITION BY toYYYYMMDD(Column3) - ORDER BY (Column3, Column2, Column1) - TTL Column3 + INTERVAL 1 MONTH TO VOLUME 'external' - SETTINGS storage_policy = 'external_with_jbods';""" - ) - - print("Preparation completed") - - def check(self): - first = cluster.instances["first_of_two"] - second = cluster.instances["second_of_two"] - - a = first.query("SELECT count() from db_move_to_volume.source") - b = second.query("SELECT count() from db_move_to_volume.destination") - assert a == b, "Count" - - a = TSV( - first.query( - """SELECT sipHash64(*) from db_move_to_volume.source - ORDER BY (Column1, Column2, Column3, Column4, Column5)""" - ) - ) - b = TSV( - second.query( - """SELECT sipHash64(*) from db_move_to_volume.destination - ORDER BY (Column1, Column2, Column3, Column4, Column5)""" - ) - ) - assert a == b, "Data" - - first.query("DROP DATABASE IF EXISTS db_move_to_volume SYNC") - second.query("DROP DATABASE IF EXISTS db_move_to_volume SYNC") - - -class TaskDropTargetPartition: - def __init__(self, cluster): - self.cluster = cluster - self.zk_task_path = "/clickhouse-copier/task_drop_target_partition" - self.container_task_file = "/task_drop_target_partition.xml" - - for instance_name, _ in cluster.instances.items(): - instance = cluster.instances[instance_name] - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "./task_drop_target_partition.xml"), - self.container_task_file, - ) - print( - "Copied task file to container of '{}' instance. 
Path {}".format( - instance_name, self.container_task_file - ) - ) - - def start(self): - first = cluster.instances["first_of_two"] - second = cluster.instances["second_of_two"] - - first.query("DROP DATABASE IF EXISTS db_drop_target_partition SYNC") - second.query("DROP DATABASE IF EXISTS db_drop_target_partition SYNC") - - first.query("CREATE DATABASE IF NOT EXISTS db_drop_target_partition;") - first.query( - """CREATE TABLE db_drop_target_partition.source - ( - Column1 UInt64, - Column2 Int32, - Column3 Date, - Column4 DateTime, - Column5 String - ) - ENGINE = MergeTree() - PARTITION BY (toYYYYMMDD(Column3), Column3) - PRIMARY KEY (Column1, Column2, Column3) - ORDER BY (Column1, Column2, Column3);""" - ) - - first.query( - """INSERT INTO db_drop_target_partition.source SELECT * FROM generateRandom( - 'Column1 UInt64, Column2 Int32, Column3 Date, Column4 DateTime, Column5 String', 1, 10, 2) LIMIT 100;""" - ) - - second.query("CREATE DATABASE IF NOT EXISTS db_drop_target_partition;") - second.query( - """CREATE TABLE db_drop_target_partition.destination - ( - Column1 UInt64, - Column2 Int32, - Column3 Date, - Column4 DateTime, - Column5 String - ) ENGINE = MergeTree() - PARTITION BY toYYYYMMDD(Column3) - ORDER BY (Column3, Column2, Column1);""" - ) - - # Insert data in target too. It has to be dropped. - first.query( - """INSERT INTO db_drop_target_partition.destination SELECT * FROM db_drop_target_partition.source;""" - ) - - print("Preparation completed") - - def check(self): - first = cluster.instances["first_of_two"] - second = cluster.instances["second_of_two"] - - a = first.query("SELECT count() from db_drop_target_partition.source") - b = second.query("SELECT count() from db_drop_target_partition.destination") - assert a == b, "Count" - - a = TSV( - first.query( - """SELECT sipHash64(*) from db_drop_target_partition.source - ORDER BY (Column1, Column2, Column3, Column4, Column5)""" - ) - ) - b = TSV( - second.query( - """SELECT sipHash64(*) from db_drop_target_partition.destination - ORDER BY (Column1, Column2, Column3, Column4, Column5)""" - ) - ) - assert a == b, "Data" - - first.query("DROP DATABASE IF EXISTS db_drop_target_partition SYNC") - second.query("DROP DATABASE IF EXISTS db_drop_target_partition SYNC") - - -def execute_task(started_cluster, task, cmd_options): - task.start() - - zk = started_cluster.get_kazoo_client("zoo1") - print("Use ZooKeeper server: {}:{}".format(zk.hosts[0][0], zk.hosts[0][1])) - - # Run cluster-copier processes on each node - docker_api = started_cluster.docker_client.api - copiers_exec_ids = [] - - cmd = [ - "/usr/bin/clickhouse", - "copier", - "--config", - "/etc/clickhouse-server/config-copier.xml", - "--task-path", - task.zk_task_path, - "--task-file", - task.container_task_file, - "--task-upload-force", - "true", - "--base-dir", - "/var/log/clickhouse-server/copier", - ] - cmd += cmd_options - - print(cmd) - - for instance_name in started_cluster.instances.keys(): - instance = started_cluster.instances[instance_name] - container = instance.get_docker_handle() - instance.copy_file_to_container( - os.path.join(CURRENT_TEST_DIR, "configs_two_nodes/config-copier.xml"), - "/etc/clickhouse-server/config-copier.xml", - ) - logging.info("Copied copier config to {}".format(instance.name)) - exec_id = docker_api.exec_create(container.id, cmd, stderr=True) - output = docker_api.exec_start(exec_id).decode("utf8") - logging.info(output) - copiers_exec_ids.append(exec_id) - logging.info( - "Copier for {} ({}) has started".format(instance.name, 
instance.ip_address) - ) - - # time.sleep(1000) - - # Wait for copiers stopping and check their return codes - for exec_id, instance in zip( - copiers_exec_ids, iter(started_cluster.instances.values()) - ): - while True: - res = docker_api.exec_inspect(exec_id) - if not res["Running"]: - break - time.sleep(1) - - assert res["ExitCode"] == 0, "Instance: {} ({}). Info: {}".format( - instance.name, instance.ip_address, repr(res) - ) - - try: - task.check() - finally: - zk.delete(task.zk_task_path, recursive=True) diff --git a/tests/integration/test_config_xml_full/configs/config.xml b/tests/integration/test_config_xml_full/configs/config.xml index ac59b3428e8..628e1432350 100644 --- a/tests/integration/test_config_xml_full/configs/config.xml +++ b/tests/integration/test_config_xml_full/configs/config.xml @@ -72,7 +72,7 @@ 8123 HeaderFilterRegex: '^.*/(src|base|programs|utils)/.*(h|hpp)$' HeaderFilterRegex: '^.*/(base|programs|utils)/.*(h|hpp)$' -Checks: '*, - -abseil-*, +Checks: [ + '*', - -altera-*, + '-abseil-*', - -android-*, + '-altera-*', - -bugprone-assignment-in-if-condition, - -bugprone-branch-clone, - -bugprone-easily-swappable-parameters, - -bugprone-exception-escape, - -bugprone-implicit-widening-of-multiplication-result, - -bugprone-narrowing-conversions, - -bugprone-not-null-terminated-result, - -bugprone-reserved-identifier, # useful but too slow, TODO retry when https://reviews.llvm.org/rG1c282052624f9d0bd273bde0b47b30c96699c6c7 is merged - -bugprone-unchecked-optional-access, + '-android-*', - -cert-dcl16-c, - -cert-dcl37-c, - -cert-dcl51-cpp, - -cert-err58-cpp, - -cert-msc32-c, - -cert-msc51-cpp, - -cert-oop54-cpp, - -cert-oop57-cpp, + '-bugprone-assignment-in-if-condition', + '-bugprone-branch-clone', + '-bugprone-easily-swappable-parameters', + '-bugprone-exception-escape', + '-bugprone-implicit-widening-of-multiplication-result', + '-bugprone-narrowing-conversions', + '-bugprone-not-null-terminated-result', + '-bugprone-reserved-identifier', # useful but too slow, TODO retry when https://reviews.llvm.org/rG1c282052624f9d0bd273bde0b47b30c96699c6c7 is merged + '-bugprone-unchecked-optional-access', - -clang-analyzer-unix.Malloc, + '-cert-dcl16-c', + '-cert-dcl37-c', + '-cert-dcl51-cpp', + '-cert-err58-cpp', + '-cert-msc32-c', + '-cert-msc51-cpp', + '-cert-oop54-cpp', + '-cert-oop57-cpp', - -cppcoreguidelines-*, # impractical in a codebase as large as ClickHouse, also slow + '-clang-analyzer-unix.Malloc', - -darwin-*, + '-cppcoreguidelines-*', # impractical in a codebase as large as ClickHouse, also slow - -fuchsia-*, + '-darwin-*', - -google-build-using-namespace, - -google-readability-braces-around-statements, - -google-readability-casting, - -google-readability-function-size, - -google-readability-namespace-comments, - -google-readability-todo, + '-fuchsia-*', - -hicpp-avoid-c-arrays, - -hicpp-avoid-goto, - -hicpp-braces-around-statements, - -hicpp-explicit-conversions, - -hicpp-function-size, - -hicpp-member-init, - -hicpp-move-const-arg, - -hicpp-multiway-paths-covered, - -hicpp-named-parameter, - -hicpp-no-array-decay, - -hicpp-no-assembler, - -hicpp-no-malloc, - -hicpp-signed-bitwise, - -hicpp-special-member-functions, - -hicpp-uppercase-literal-suffix, - -hicpp-use-auto, - -hicpp-use-emplace, - -hicpp-vararg, + '-google-build-using-namespace', + '-google-readability-braces-around-statements', + '-google-readability-casting', + '-google-readability-function-size', + '-google-readability-namespace-comments', + '-google-readability-todo', - -linuxkernel-*, + 
'-hicpp-avoid-c-arrays', + '-hicpp-avoid-goto', + '-hicpp-braces-around-statements', + '-hicpp-explicit-conversions', + '-hicpp-function-size', + '-hicpp-member-init', + '-hicpp-move-const-arg', + '-hicpp-multiway-paths-covered', + '-hicpp-named-parameter', + '-hicpp-no-array-decay', + '-hicpp-no-assembler', + '-hicpp-no-malloc', + '-hicpp-signed-bitwise', + '-hicpp-special-member-functions', + '-hicpp-uppercase-literal-suffix', + '-hicpp-use-auto', + '-hicpp-use-emplace', + '-hicpp-vararg', - -llvm-*, + '-linuxkernel-*', - -llvmlibc-*, + '-llvm-*', - -openmp-*, + '-llvmlibc-*', - -misc-const-correctness, - -misc-include-cleaner, # useful but far too many occurrences - -misc-no-recursion, - -misc-non-private-member-variables-in-classes, - -misc-confusable-identifiers, # useful but slooow - -misc-use-anonymous-namespace, + '-openmp-*', - -modernize-avoid-c-arrays, - -modernize-concat-nested-namespaces, - -modernize-macro-to-enum, - -modernize-pass-by-value, - -modernize-return-braced-init-list, - -modernize-use-auto, - -modernize-use-default-member-init, - -modernize-use-emplace, - -modernize-use-nodiscard, - -modernize-use-override, - -modernize-use-trailing-return-type, + '-misc-const-correctness', + '-misc-include-cleaner', # useful but far too many occurrences + '-misc-no-recursion', + '-misc-non-private-member-variables-in-classes', + '-misc-confusable-identifiers', # useful but slooow + '-misc-use-anonymous-namespace', - -performance-inefficient-string-concatenation, - -performance-no-int-to-ptr, - -performance-avoid-endl, - -performance-unnecessary-value-param, + '-modernize-avoid-c-arrays', + '-modernize-concat-nested-namespaces', + '-modernize-macro-to-enum', + '-modernize-pass-by-value', + '-modernize-return-braced-init-list', + '-modernize-use-auto', + '-modernize-use-default-member-init', + '-modernize-use-emplace', + '-modernize-use-nodiscard', + '-modernize-use-override', + '-modernize-use-trailing-return-type', - -portability-simd-intrinsics, + '-performance-inefficient-string-concatenation', + '-performance-no-int-to-ptr', + '-performance-avoid-endl', + '-performance-unnecessary-value-param', - -readability-avoid-unconditional-preprocessor-if, - -readability-braces-around-statements, - -readability-convert-member-functions-to-static, - -readability-else-after-return, - -readability-function-cognitive-complexity, - -readability-function-size, - -readability-identifier-length, - -readability-identifier-naming, # useful but too slow - -readability-implicit-bool-conversion, - -readability-isolate-declaration, - -readability-magic-numbers, - -readability-named-parameter, - -readability-redundant-declaration, - -readability-simplify-boolean-expr, - -readability-static-accessed-through-instance, - -readability-suspicious-call-argument, - -readability-uppercase-literal-suffix, - -readability-use-anyofallof, + '-portability-simd-intrinsics', - -zircon-*, -' + '-readability-avoid-unconditional-preprocessor-if', + '-readability-braces-around-statements', + '-readability-convert-member-functions-to-static', + '-readability-else-after-return', + '-readability-function-cognitive-complexity', + '-readability-function-size', + '-readability-identifier-length', + '-readability-identifier-naming', # useful but too slow + '-readability-implicit-bool-conversion', + '-readability-isolate-declaration', + '-readability-magic-numbers', + '-readability-named-parameter', + '-readability-redundant-declaration', + '-readability-simplify-boolean-expr', + '-readability-static-accessed-through-instance', +
'-readability-suspicious-call-argument', + '-readability-uppercase-literal-suffix', + '-readability-use-anyofallof', + + '-zircon-*' +] WarningsAsErrors: '*' From e5e84419aff0f559bc545737bfdc0518a732f7ff Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Sun, 10 Mar 2024 14:29:18 +0000 Subject: [PATCH 281/985] Fix clang-tidy-s --- contrib/libmetrohash/src/metrohash128.h | 3 +++ src/Access/AccessControl.h | 10 +++++----- src/Access/IAccessStorage.cpp | 2 +- src/Access/IAccessStorage.h | 2 +- src/Common/Arena.h | 4 +--- src/Common/DNSResolver.cpp | 2 +- src/Common/DNSResolver.h | 2 +- src/Common/DateLUTImpl.h | 2 +- src/Common/MultiVersion.h | 4 ++-- src/Common/PODArray.h | 6 +++--- src/Common/SipHash.h | 2 +- src/Common/TransactionID.h | 2 +- src/Common/ZooKeeper/IKeeper.cpp | 8 ++++---- src/Common/ZooKeeper/IKeeper.h | 16 ++++++++-------- src/Common/logger_useful.h | 16 ++++++++-------- src/Core/PostgreSQL/insertPostgreSQLValue.cpp | 4 ++-- src/Core/PostgreSQL/insertPostgreSQLValue.h | 4 ++-- src/Core/Settings.h | 2 ++ src/Dictionaries/CacheDictionary.cpp | 4 ++-- src/Dictionaries/CacheDictionary.h | 2 +- .../GeodataProviders/IHierarchiesProvider.h | 2 +- src/Dictionaries/RegExpTreeDictionary.cpp | 2 +- src/Dictionaries/RegExpTreeDictionary.h | 2 +- src/Functions/IFunction.h | 4 ---- src/IO/ReadSettings.h | 1 + src/Interpreters/AsynchronousInsertQueue.cpp | 2 +- src/Interpreters/AsynchronousInsertQueue.h | 2 +- src/Interpreters/Context.h | 4 ++-- src/Interpreters/IExternalLoadable.h | 2 +- src/Interpreters/ProcessList.h | 2 +- src/Processors/Chunk.h | 2 +- .../Algorithms/AggregatingSortedAlgorithm.cpp | 2 +- src/Processors/Port.h | 2 +- src/Processors/TTL/TTLUpdateInfoAlgorithm.cpp | 4 ++-- src/Processors/TTL/TTLUpdateInfoAlgorithm.h | 4 ++-- src/Storages/StorageInMemoryMetadata.h | 4 ++-- 36 files changed, 69 insertions(+), 69 deletions(-) diff --git a/contrib/libmetrohash/src/metrohash128.h b/contrib/libmetrohash/src/metrohash128.h index 2dbb6ca5a8a..f507c917caf 100644 --- a/contrib/libmetrohash/src/metrohash128.h +++ b/contrib/libmetrohash/src/metrohash128.h @@ -17,6 +17,8 @@ #ifndef METROHASH_METROHASH_128_H #define METROHASH_METROHASH_128_H +// NOLINTBEGIN(readability-avoid-const-params-in-decls) + #include class MetroHash128 @@ -68,5 +70,6 @@ private: void metrohash128_1(const uint8_t * key, uint64_t len, uint32_t seed, uint8_t * out); void metrohash128_2(const uint8_t * key, uint64_t len, uint32_t seed, uint8_t * out); +// NOLINTEND(readability-avoid-const-params-in-decls) #endif // #ifndef METROHASH_METROHASH_128_H diff --git a/src/Access/AccessControl.h b/src/Access/AccessControl.h index 55ea4e4f717..1af74e02fb7 100644 --- a/src/Access/AccessControl.h +++ b/src/Access/AccessControl.h @@ -133,20 +133,20 @@ public: /// This function also enables custom prefixes to be used. void setCustomSettingsPrefixes(const Strings & prefixes); void setCustomSettingsPrefixes(const String & comma_separated_prefixes); - bool isSettingNameAllowed(const std::string_view name) const; - void checkSettingNameIsAllowed(const std::string_view name) const; + bool isSettingNameAllowed(std::string_view name) const; + void checkSettingNameIsAllowed(std::string_view name) const; /// Allows implicit user creation without password (by default it's allowed). /// In other words, allow 'CREATE USER' queries without 'IDENTIFIED WITH' clause. 
- void setImplicitNoPasswordAllowed(const bool allow_implicit_no_password_); + void setImplicitNoPasswordAllowed(bool allow_implicit_no_password_); bool isImplicitNoPasswordAllowed() const; /// Allows users without password (by default it's allowed). - void setNoPasswordAllowed(const bool allow_no_password_); + void setNoPasswordAllowed(bool allow_no_password_); bool isNoPasswordAllowed() const; /// Allows users with plaintext password (by default it's allowed). - void setPlaintextPasswordAllowed(const bool allow_plaintext_password_); + void setPlaintextPasswordAllowed(bool allow_plaintext_password_); bool isPlaintextPasswordAllowed() const; /// Default password type when the user does not specify it. diff --git a/src/Access/IAccessStorage.cpp b/src/Access/IAccessStorage.cpp index fbe9e231002..1d6b8d99cd5 100644 --- a/src/Access/IAccessStorage.cpp +++ b/src/Access/IAccessStorage.cpp @@ -616,7 +616,7 @@ UUID IAccessStorage::generateRandomID() } -void IAccessStorage::clearConflictsInEntitiesList(std::vector> & entities, const LoggerPtr log_) +void IAccessStorage::clearConflictsInEntitiesList(std::vector> & entities, LoggerPtr log_) { std::unordered_map positions_by_id; std::unordered_map positions_by_type_and_name[static_cast(AccessEntityType::MAX)]; diff --git a/src/Access/IAccessStorage.h b/src/Access/IAccessStorage.h index ebb5a39cdf0..ad78bf92e02 100644 --- a/src/Access/IAccessStorage.h +++ b/src/Access/IAccessStorage.h @@ -228,7 +228,7 @@ protected: static UUID generateRandomID(); LoggerPtr getLogger() const; static String formatEntityTypeWithName(AccessEntityType type, const String & name) { return AccessEntityTypeInfo::get(type).formatEntityNameWithType(name); } - static void clearConflictsInEntitiesList(std::vector> & entities, const LoggerPtr log_); + static void clearConflictsInEntitiesList(std::vector> & entities, LoggerPtr log_); [[noreturn]] void throwNotFound(const UUID & id) const; [[noreturn]] void throwNotFound(AccessEntityType type, const String & name) const; [[noreturn]] static void throwBadCast(const UUID & id, AccessEntityType type, const String & name, AccessEntityType required_type); diff --git a/src/Common/Arena.h b/src/Common/Arena.h index cb26397844b..ba5b9ea9205 100644 --- a/src/Common/Arena.h +++ b/src/Common/Arena.h @@ -47,9 +47,7 @@ private: std::unique_ptr prev; - MemoryChunk() - { - } + MemoryChunk() = default; void swap(MemoryChunk & other) { diff --git a/src/Common/DNSResolver.cpp b/src/Common/DNSResolver.cpp index e36e1483da8..4b577a251af 100644 --- a/src/Common/DNSResolver.cpp +++ b/src/Common/DNSResolver.cpp @@ -297,7 +297,7 @@ void DNSResolver::setDisableCacheFlag(bool is_disabled) impl->disable_cache = is_disabled; } -void DNSResolver::setCacheMaxEntries(const UInt64 cache_max_entries) +void DNSResolver::setCacheMaxEntries(UInt64 cache_max_entries) { impl->cache_address.setMaxSizeInBytes(cache_max_entries); impl->cache_host.setMaxSizeInBytes(cache_max_entries); diff --git a/src/Common/DNSResolver.h b/src/Common/DNSResolver.h index e3030e51a96..1ddd9d3b991 100644 --- a/src/Common/DNSResolver.h +++ b/src/Common/DNSResolver.h @@ -56,7 +56,7 @@ public: void setDisableCacheFlag(bool is_disabled = true); /// Set a limit of entries in cache - void setCacheMaxEntries(const UInt64 cache_max_entries); + void setCacheMaxEntries(UInt64 cache_max_entries); /// Drops all caches void dropCache(); diff --git a/src/Common/DateLUTImpl.h b/src/Common/DateLUTImpl.h index 7bf66c0504a..4087e77d588 100644 --- a/src/Common/DateLUTImpl.h +++ b/src/Common/DateLUTImpl.h @@ 
-255,7 +255,7 @@ private: static LUTIndex toLUTIndex(ExtendedDayNum d) { - return normalizeLUTIndex(static_cast(d + daynum_offset_epoch)); + return normalizeLUTIndex(static_cast(d) + daynum_offset_epoch); } LUTIndex toLUTIndex(Time t) const diff --git a/src/Common/MultiVersion.h b/src/Common/MultiVersion.h index 8f488f9fcbc..680e224f869 100644 --- a/src/Common/MultiVersion.h +++ b/src/Common/MultiVersion.h @@ -41,9 +41,9 @@ public: } /// There is no copy constructor because only one MultiVersion should own the same object. - MultiVersion(MultiVersion && src) { *this = std::move(src); } + MultiVersion(MultiVersion && src) { *this = std::move(src); } /// NOLINT - MultiVersion & operator=(MultiVersion && src) + MultiVersion & operator=(MultiVersion && src) /// NOLINT { if (this != &src) { diff --git a/src/Common/PODArray.h b/src/Common/PODArray.h index 1a4047a2588..af863e01fb2 100644 --- a/src/Common/PODArray.h +++ b/src/Common/PODArray.h @@ -25,7 +25,7 @@ */ template constexpr bool memcpy_can_be_used_for_assignment = std::is_same_v - || (std::is_integral_v && std::is_integral_v && sizeof(T) == sizeof(U)); + || (std::is_integral_v && std::is_integral_v && sizeof(T) == sizeof(U)); /// NOLINT(misc-redundant-expression) namespace DB { @@ -558,7 +558,7 @@ public: } template - void swap(PODArray & rhs, TAllocatorParams &&... allocator_params) + void swap(PODArray & rhs, TAllocatorParams &&... allocator_params) /// NOLINT(performance-noexcept-swap) { #ifndef NDEBUG this->unprotect(); @@ -756,7 +756,7 @@ public: }; template -void swap(PODArray & lhs, PODArray & rhs) +void swap(PODArray & lhs, PODArray & rhs) /// NOLINT { lhs.swap(rhs); } diff --git a/src/Common/SipHash.h b/src/Common/SipHash.h index 729fb76a573..c89ee2c9d90 100644 --- a/src/Common/SipHash.h +++ b/src/Common/SipHash.h @@ -149,7 +149,7 @@ public: /// Pad the remainder, which is missing up to an 8-byte word. current_word = 0; - switch (end - data) + switch (end - data) /// NOLINT(bugprone-switch-missing-default-case) { case 7: current_bytes[CURRENT_BYTES_IDX(6)] = data[6]; [[fallthrough]]; case 6: current_bytes[CURRENT_BYTES_IDX(5)] = data[5]; [[fallthrough]]; diff --git a/src/Common/TransactionID.h b/src/Common/TransactionID.h index 3ab86f7589c..97d0072bc14 100644 --- a/src/Common/TransactionID.h +++ b/src/Common/TransactionID.h @@ -16,7 +16,7 @@ class MergeTreeTransaction; /// or transaction object is not needed and not passed intentionally. 
#ifndef NO_TRANSACTION_PTR #define NO_TRANSACTION_PTR std::shared_ptr(nullptr) -#define NO_TRANSACTION_RAW static_cast(nullptr) +#define NO_TRANSACTION_RAW static_cast(nullptr) /// NOLINT(bugprone-macro-parentheses) #endif /// Commit Sequence Number diff --git a/src/Common/ZooKeeper/IKeeper.cpp b/src/Common/ZooKeeper/IKeeper.cpp index 6c47ea68b84..7d2602bde1e 100644 --- a/src/Common/ZooKeeper/IKeeper.cpp +++ b/src/Common/ZooKeeper/IKeeper.cpp @@ -23,7 +23,7 @@ namespace ProfileEvents namespace Coordination { -void Exception::incrementErrorMetrics(const Error code_) +void Exception::incrementErrorMetrics(Error code_) { if (Coordination::isUserError(code_)) ProfileEvents::increment(ProfileEvents::ZooKeeperUserExceptions); @@ -33,14 +33,14 @@ void Exception::incrementErrorMetrics(const Error code_) ProfileEvents::increment(ProfileEvents::ZooKeeperOtherExceptions); } -Exception::Exception(const std::string & msg, const Error code_, int) +Exception::Exception(const std::string & msg, Error code_, int) : DB::Exception(msg, DB::ErrorCodes::KEEPER_EXCEPTION) , code(code_) { incrementErrorMetrics(code); } -Exception::Exception(PreformattedMessage && msg, const Error code_) +Exception::Exception(PreformattedMessage && msg, Error code_) : DB::Exception(std::move(msg), DB::ErrorCodes::KEEPER_EXCEPTION) , code(code_) { @@ -48,7 +48,7 @@ Exception::Exception(PreformattedMessage && msg, const Error code_) incrementErrorMetrics(code); } -Exception::Exception(const Error code_) +Exception::Exception(Error code_) : Exception(code_, "Coordination error: {}", errorMessage(code_)) { } diff --git a/src/Common/ZooKeeper/IKeeper.h b/src/Common/ZooKeeper/IKeeper.h index c7b902ea03a..ec49c94808e 100644 --- a/src/Common/ZooKeeper/IKeeper.h +++ b/src/Common/ZooKeeper/IKeeper.h @@ -466,13 +466,13 @@ class Exception : public DB::Exception { private: /// Delegate constructor, used to minimize repetition; last parameter used for overload resolution. - Exception(const std::string & msg, const Error code_, int); /// NOLINT - Exception(PreformattedMessage && msg, const Error code_); + Exception(const std::string & msg, Error code_, int); /// NOLINT + Exception(PreformattedMessage && msg, Error code_); /// Message must be a compile-time constant template requires std::is_convertible_v - Exception(T && message, const Error code_) : DB::Exception(std::forward(message), DB::ErrorCodes::KEEPER_EXCEPTION, /* remote_= */ false), code(code_) + Exception(T && message, Error code_) : DB::Exception(std::forward(message), DB::ErrorCodes::KEEPER_EXCEPTION, /* remote_= */ false), code(code_) { incrementErrorMetrics(code); } @@ -480,23 +480,23 @@ private: static void incrementErrorMetrics(Error code_); public: - explicit Exception(const Error code_); /// NOLINT + explicit Exception(Error code_); /// NOLINT Exception(const Exception & exc); template - Exception(const Error code_, FormatStringHelper fmt, Args &&... args) + Exception(Error code_, FormatStringHelper fmt, Args &&... args) : DB::Exception(DB::ErrorCodes::KEEPER_EXCEPTION, std::move(fmt), std::forward(args)...) 
, code(code_) { incrementErrorMetrics(code); } - inline static Exception createDeprecated(const std::string & msg, const Error code_) + inline static Exception createDeprecated(const std::string & msg, Error code_) { return Exception(msg, code_, 0); } - inline static Exception fromPath(const Error code_, const std::string & path) + inline static Exception fromPath(Error code_, const std::string & path) { return Exception(code_, "Coordination error: {}, path {}", errorMessage(code_), path); } @@ -504,7 +504,7 @@ public: /// Message must be a compile-time constant template requires std::is_convertible_v - inline static Exception fromMessage(const Error code_, T && message) + inline static Exception fromMessage(Error code_, T && message) { return Exception(std::forward(message), code_); } diff --git a/src/Common/logger_useful.h b/src/Common/logger_useful.h index 8e78e93e198..013b35e695e 100644 --- a/src/Common/logger_useful.h +++ b/src/Common/logger_useful.h @@ -19,14 +19,14 @@ namespace Poco { class Logger; } using LogSeriesLimiterPtr = std::shared_ptr; -namespace +namespace impl { - [[maybe_unused]] LoggerPtr getLoggerHelper(const LoggerPtr & logger) { return logger; } - [[maybe_unused]] LoggerPtr getLoggerHelper(const AtomicLogger & logger) { return logger.load(); } - [[maybe_unused]] const ::Poco::Logger * getLoggerHelper(const ::Poco::Logger * logger) { return logger; } - [[maybe_unused]] std::unique_ptr getLoggerHelper(std::unique_ptr && logger) { return logger; } - [[maybe_unused]] std::unique_ptr getLoggerHelper(std::unique_ptr && logger) { return logger; } - [[maybe_unused]] LogSeriesLimiterPtr getLoggerHelper(LogSeriesLimiterPtr & logger) { return logger; } + [[maybe_unused]] inline LoggerPtr getLoggerHelper(const LoggerPtr & logger) { return logger; } + [[maybe_unused]] inline LoggerPtr getLoggerHelper(const AtomicLogger & logger) { return logger.load(); } + [[maybe_unused]] inline const ::Poco::Logger * getLoggerHelper(const ::Poco::Logger * logger) { return logger; } + [[maybe_unused]] inline std::unique_ptr getLoggerHelper(std::unique_ptr && logger) { return logger; } + [[maybe_unused]] inline std::unique_ptr getLoggerHelper(std::unique_ptr && logger) { return logger; } + [[maybe_unused]] inline LogSeriesLimiterPtr getLoggerHelper(LogSeriesLimiterPtr & logger) { return logger; } } #define LOG_IMPL_FIRST_ARG(X, ...) X @@ -65,7 +65,7 @@ namespace #define LOG_IMPL(logger, priority, PRIORITY, ...) 
do \ { \ - auto _logger = ::getLoggerHelper(logger); \ + auto _logger = ::impl::getLoggerHelper(logger); \ const bool _is_clients_log = (DB::CurrentThread::getGroup() != nullptr) && \ (DB::CurrentThread::get().getClientLogsLevel() >= (priority)); \ if (!_is_clients_log && !_logger->is((PRIORITY))) \ diff --git a/src/Core/PostgreSQL/insertPostgreSQLValue.cpp b/src/Core/PostgreSQL/insertPostgreSQLValue.cpp index aa60bdee28a..b507b300769 100644 --- a/src/Core/PostgreSQL/insertPostgreSQLValue.cpp +++ b/src/Core/PostgreSQL/insertPostgreSQLValue.cpp @@ -36,7 +36,7 @@ void insertDefaultPostgreSQLValue(IColumn & column, const IColumn & sample_colum void insertPostgreSQLValue( IColumn & column, std::string_view value, - const ExternalResultDescription::ValueType type, const DataTypePtr data_type, + ExternalResultDescription::ValueType type, DataTypePtr data_type, const std::unordered_map & array_info, size_t idx) { switch (type) @@ -170,7 +170,7 @@ void insertPostgreSQLValue( void preparePostgreSQLArrayInfo( - std::unordered_map & array_info, size_t column_idx, const DataTypePtr data_type) + std::unordered_map & array_info, size_t column_idx, DataTypePtr data_type) { const auto * array_type = typeid_cast(data_type.get()); auto nested = array_type->getNestedType(); diff --git a/src/Core/PostgreSQL/insertPostgreSQLValue.h b/src/Core/PostgreSQL/insertPostgreSQLValue.h index 3bc83292b96..bfb85422aa1 100644 --- a/src/Core/PostgreSQL/insertPostgreSQLValue.h +++ b/src/Core/PostgreSQL/insertPostgreSQLValue.h @@ -22,11 +22,11 @@ struct PostgreSQLArrayInfo void insertPostgreSQLValue( IColumn & column, std::string_view value, - const ExternalResultDescription::ValueType type, const DataTypePtr data_type, + ExternalResultDescription::ValueType type, DataTypePtr data_type, const std::unordered_map & array_info, size_t idx); void preparePostgreSQLArrayInfo( - std::unordered_map & array_info, size_t column_idx, const DataTypePtr data_type); + std::unordered_map & array_info, size_t column_idx, DataTypePtr data_type); void insertDefaultPostgreSQLValue(IColumn & column, const IColumn & sample_column); diff --git a/src/Core/Settings.h b/src/Core/Settings.h index d70a6cf51c5..c41db9d2141 100644 --- a/src/Core/Settings.h +++ b/src/Core/Settings.h @@ -1192,6 +1192,7 @@ class IColumn; FORMAT_FACTORY_SETTINGS(M, ALIAS) \ OBSOLETE_FORMAT_SETTINGS(M, ALIAS) \ +/// NOLINTNEXTLINE(clang-analyzer-optin.performance.Padding) DECLARE_SETTINGS_TRAITS_ALLOW_CUSTOM_SETTINGS(SettingsTraits, LIST_OF_SETTINGS) @@ -1236,6 +1237,7 @@ private: /* * User-specified file format settings for File and URL engines. 
*/ +/// NOLINTNEXTLINE(clang-analyzer-optin.performance.Padding) DECLARE_SETTINGS_TRAITS(FormatFactorySettingsTraits, LIST_OF_ALL_FORMAT_SETTINGS) struct FormatFactorySettings : public BaseSettings diff --git a/src/Dictionaries/CacheDictionary.cpp b/src/Dictionaries/CacheDictionary.cpp index 8444042db9e..6e9b09f8919 100644 --- a/src/Dictionaries/CacheDictionary.cpp +++ b/src/Dictionaries/CacheDictionary.cpp @@ -423,7 +423,7 @@ MutableColumns CacheDictionary::aggregateColumnsInOrderOfKe const DictionaryStorageFetchRequest & request, const MutableColumns & fetched_columns, const PaddedPODArray & key_index_to_state, - IColumn::Filter * const default_mask) const + IColumn::Filter * default_mask) const { MutableColumns aggregated_columns = request.makeAttributesResultColumns(); @@ -473,7 +473,7 @@ MutableColumns CacheDictionary::aggregateColumns( const PaddedPODArray & key_index_to_fetched_columns_from_storage_result, const MutableColumns & fetched_columns_during_update, const HashMap & found_keys_to_fetched_columns_during_update_index, - IColumn::Filter * const default_mask) const + IColumn::Filter * default_mask) const { /** * Aggregation of columns fetched from storage and from source during update. diff --git a/src/Dictionaries/CacheDictionary.h b/src/Dictionaries/CacheDictionary.h index 8897fb40fa9..c02fb91c60e 100644 --- a/src/Dictionaries/CacheDictionary.h +++ b/src/Dictionaries/CacheDictionary.h @@ -162,7 +162,7 @@ private: const DictionaryStorageFetchRequest & request, const MutableColumns & fetched_columns, const PaddedPODArray & key_index_to_state, - IColumn::Filter * const default_mask = nullptr) const; + IColumn::Filter * default_mask = nullptr) const; MutableColumns aggregateColumns( const PaddedPODArray & keys, diff --git a/src/Dictionaries/Embedded/GeodataProviders/IHierarchiesProvider.h b/src/Dictionaries/Embedded/GeodataProviders/IHierarchiesProvider.h index 68ab0fdca2d..a4b88127786 100644 --- a/src/Dictionaries/Embedded/GeodataProviders/IHierarchiesProvider.h +++ b/src/Dictionaries/Embedded/GeodataProviders/IHierarchiesProvider.h @@ -14,7 +14,7 @@ class IRegionsHierarchyReader public: virtual bool readNext(RegionEntry & entry) = 0; - virtual ~IRegionsHierarchyReader() {} + virtual ~IRegionsHierarchyReader() = default; }; using IRegionsHierarchyReaderPtr = std::unique_ptr; diff --git a/src/Dictionaries/RegExpTreeDictionary.cpp b/src/Dictionaries/RegExpTreeDictionary.cpp index 4d82aa9ca0e..1f5c2d6d2c7 100644 --- a/src/Dictionaries/RegExpTreeDictionary.cpp +++ b/src/Dictionaries/RegExpTreeDictionary.cpp @@ -568,7 +568,7 @@ bool RegExpTreeDictionary::setAttributesShortCircuit( const String & data, std::unordered_set & visited_nodes, const std::unordered_map & attributes, - std::unordered_set * const defaults) const + std::unordered_set * defaults) const { if (visited_nodes.contains(id)) return attributes_to_set.attributesFull() == attributes.size(); diff --git a/src/Dictionaries/RegExpTreeDictionary.h b/src/Dictionaries/RegExpTreeDictionary.h index 9e14abb49d0..d6bc90ef651 100644 --- a/src/Dictionaries/RegExpTreeDictionary.h +++ b/src/Dictionaries/RegExpTreeDictionary.h @@ -210,7 +210,7 @@ private: const String & data, std::unordered_set & visited_nodes, const std::unordered_map & attributes, - std::unordered_set * const defaults) const; + std::unordered_set * defaults) const; struct RegexTreeNode; using RegexTreeNodePtr = std::shared_ptr; diff --git a/src/Functions/IFunction.h b/src/Functions/IFunction.h index 05aa08e2ad7..9b7cdf12d57 100644 --- a/src/Functions/IFunction.h +++ 
b/src/Functions/IFunction.h @@ -13,10 +13,6 @@ #include -#if USE_EMBEDDED_COMPILER -# include -#endif - /// This file contains user interface for functions. namespace llvm diff --git a/src/IO/ReadSettings.h b/src/IO/ReadSettings.h index 38904df4403..5c401c0c8d9 100644 --- a/src/IO/ReadSettings.h +++ b/src/IO/ReadSettings.h @@ -63,6 +63,7 @@ enum class RemoteFSReadMethod class MMappedFileCache; class PageCache; +/// NOLINTNEXTLINE(clang-analyzer-optin.performance.Padding) struct ReadSettings { /// Method to use reading from local filesystem. diff --git a/src/Interpreters/AsynchronousInsertQueue.cpp b/src/Interpreters/AsynchronousInsertQueue.cpp index 7d56dbabe3c..9327f31b6ff 100644 --- a/src/Interpreters/AsynchronousInsertQueue.cpp +++ b/src/Interpreters/AsynchronousInsertQueue.cpp @@ -905,7 +905,7 @@ Chunk AsynchronousInsertQueue::processEntriesWithParsing( const InsertDataPtr & data, const Block & header, const ContextPtr & insert_context, - const LoggerPtr logger, + LoggerPtr logger, LogFunc && add_to_async_insert_log) { size_t total_rows = 0; diff --git a/src/Interpreters/AsynchronousInsertQueue.h b/src/Interpreters/AsynchronousInsertQueue.h index f60b3d343fb..5076701d0b0 100644 --- a/src/Interpreters/AsynchronousInsertQueue.h +++ b/src/Interpreters/AsynchronousInsertQueue.h @@ -265,7 +265,7 @@ private: const InsertDataPtr & data, const Block & header, const ContextPtr & insert_context, - const LoggerPtr logger, + LoggerPtr logger, LogFunc && add_to_async_insert_log); template diff --git a/src/Interpreters/Context.h b/src/Interpreters/Context.h index c8aa3604a6f..43df8d6adf2 100644 --- a/src/Interpreters/Context.h +++ b/src/Interpreters/Context.h @@ -330,7 +330,7 @@ protected: return *this; } - void swap(QueryAccessInfo & rhs) + void swap(QueryAccessInfo & rhs) noexcept { std::swap(databases, rhs.databases); std::swap(tables, rhs.tables); @@ -680,7 +680,7 @@ public: void addSpecialScalar(const String & name, const Block & block); const QueryAccessInfo & getQueryAccessInfo() const { return *getQueryAccessInfoPtr(); } - const QueryAccessInfoPtr getQueryAccessInfoPtr() const { return query_access_info; } + QueryAccessInfoPtr getQueryAccessInfoPtr() const { return query_access_info; } void setQueryAccessInfo(QueryAccessInfoPtr other) { query_access_info = other; } void addQueryAccessInfo( diff --git a/src/Interpreters/IExternalLoadable.h b/src/Interpreters/IExternalLoadable.h index 3c004508b0a..47031778876 100644 --- a/src/Interpreters/IExternalLoadable.h +++ b/src/Interpreters/IExternalLoadable.h @@ -23,7 +23,7 @@ struct ExternalLoadableLifetime UInt64 max_sec = 0; ExternalLoadableLifetime(const Poco::Util::AbstractConfiguration & config, const std::string & config_prefix); - ExternalLoadableLifetime() {} + ExternalLoadableLifetime() = default; }; /// Get delay before trying to load again after error. 
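A large share of the edits in this commit are mechanical: top-level `const` is dropped from by-value parameters in declarations (the pattern behind `readability-avoid-const-params-in-decls`, the same check suppressed with `NOLINTBEGIN`/`NOLINTEND` in `metrohash128.h` above), and empty special-member bodies become `= default`. A minimal, self-contained sketch of both shapes — the names below are invented for illustration and are not taken from the ClickHouse sources:

```cpp
#include <cstddef>

// Top-level const on a by-value parameter is not part of the function type,
// so in a declaration it is pure noise for callers.
// Before: void setMaxEntries(const std::size_t max_entries);
void setMaxEntries(std::size_t max_entries);

// The definition may still qualify the parameter if the implementation
// prefers it; this definition and the declaration refer to the same function.
void setMaxEntries(const std::size_t max_entries)
{
    (void)max_entries; // placeholder body
}

struct Widget
{
    // Before: Widget() {}
    Widget() = default; // same meaning, lets the compiler generate it
};
```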
diff --git a/src/Interpreters/ProcessList.h b/src/Interpreters/ProcessList.h index 1c253f562e8..ad47041c762 100644 --- a/src/Interpreters/ProcessList.h +++ b/src/Interpreters/ProcessList.h @@ -318,7 +318,7 @@ public: ~ProcessListEntry(); QueryStatusPtr getQueryStatus() { return *it; } - const QueryStatusPtr getQueryStatus() const { return *it; } + QueryStatusPtr getQueryStatus() const { return *it; } }; diff --git a/src/Processors/Chunk.h b/src/Processors/Chunk.h index 9a7d6bc294d..4f753798eaa 100644 --- a/src/Processors/Chunk.h +++ b/src/Processors/Chunk.h @@ -59,7 +59,7 @@ public: Chunk clone() const; - void swap(Chunk & other) + void swap(Chunk & other) noexcept { columns.swap(other.columns); chunk_info.swap(other.chunk_info); diff --git a/src/Processors/Merges/Algorithms/AggregatingSortedAlgorithm.cpp b/src/Processors/Merges/Algorithms/AggregatingSortedAlgorithm.cpp index d2d2434c477..3bd0b532d90 100644 --- a/src/Processors/Merges/Algorithms/AggregatingSortedAlgorithm.cpp +++ b/src/Processors/Merges/Algorithms/AggregatingSortedAlgorithm.cpp @@ -126,7 +126,7 @@ static void postprocessChunk(Chunk & chunk, const AggregatingSortedAlgorithm::Co AggregatingSortedAlgorithm::SimpleAggregateDescription::SimpleAggregateDescription( - AggregateFunctionPtr function_, const size_t column_number_, + AggregateFunctionPtr function_, size_t column_number_, DataTypePtr nested_type_, DataTypePtr real_type_) : function(std::move(function_)), column_number(column_number_) , nested_type(std::move(nested_type_)), real_type(std::move(real_type_)) diff --git a/src/Processors/Port.h b/src/Processors/Port.h index 67af2f041aa..f3c7bbb5fee 100644 --- a/src/Processors/Port.h +++ b/src/Processors/Port.h @@ -110,7 +110,7 @@ protected: return result; } - uintptr_t ALWAYS_INLINE swap(std::atomic & value, std::uintptr_t flags, std::uintptr_t mask) + uintptr_t ALWAYS_INLINE swap(std::atomic & value, std::uintptr_t flags, std::uintptr_t mask) /// NOLINT { Data * expected = nullptr; Data * desired = getPtr(flags | getUInt(data)); diff --git a/src/Processors/TTL/TTLUpdateInfoAlgorithm.cpp b/src/Processors/TTL/TTLUpdateInfoAlgorithm.cpp index b7cddf3c165..13d3030bbb8 100644 --- a/src/Processors/TTL/TTLUpdateInfoAlgorithm.cpp +++ b/src/Processors/TTL/TTLUpdateInfoAlgorithm.cpp @@ -6,8 +6,8 @@ namespace DB TTLUpdateInfoAlgorithm::TTLUpdateInfoAlgorithm( const TTLExpressions & ttl_expressions_, const TTLDescription & description_, - const TTLUpdateField ttl_update_field_, - const String ttl_update_key_, + TTLUpdateField ttl_update_field_, + String ttl_update_key_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_) diff --git a/src/Processors/TTL/TTLUpdateInfoAlgorithm.h b/src/Processors/TTL/TTLUpdateInfoAlgorithm.h index 0cf31765aef..b6aee6f7cb0 100644 --- a/src/Processors/TTL/TTLUpdateInfoAlgorithm.h +++ b/src/Processors/TTL/TTLUpdateInfoAlgorithm.h @@ -22,8 +22,8 @@ public: TTLUpdateInfoAlgorithm( const TTLExpressions & ttl_expressions_, const TTLDescription & description_, - const TTLUpdateField ttl_update_field_, - const String ttl_update_key_, + TTLUpdateField ttl_update_field_, + String ttl_update_key_, const TTLInfo & old_ttl_info_, time_t current_time_, bool force_ ); diff --git a/src/Storages/StorageInMemoryMetadata.h b/src/Storages/StorageInMemoryMetadata.h index 2823aba1224..69cd3422a7d 100644 --- a/src/Storages/StorageInMemoryMetadata.h +++ b/src/Storages/StorageInMemoryMetadata.h @@ -72,8 +72,8 @@ struct StorageInMemoryMetadata StorageInMemoryMetadata(const StorageInMemoryMetadata & other); 
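Two smaller themes show up in the hunks just above: member `swap` functions gain `noexcept` (what `performance-noexcept-swap` asks for — the same check already silenced on `PODArray::swap` with a `NOLINT`), and accessors stop returning `const`-qualified values by value, which only prevents the caller from moving the result. A hedged sketch of the `swap` half, with an invented type:

```cpp
#include <vector>

struct Buffer
{
    std::vector<char> data;

    // A swap that cannot throw should say so: generic code broadly assumes
    // swapping is cheap and non-throwing, and spelling out noexcept makes
    // that guarantee explicit and checkable.
    void swap(Buffer & other) noexcept
    {
        data.swap(other.data); // std::vector::swap does not throw here
    }
};
```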
StorageInMemoryMetadata & operator=(const StorageInMemoryMetadata & other); - StorageInMemoryMetadata(StorageInMemoryMetadata && other) = default; - StorageInMemoryMetadata & operator=(StorageInMemoryMetadata && other) = default; + StorageInMemoryMetadata(StorageInMemoryMetadata && other) = default; /// NOLINT + StorageInMemoryMetadata & operator=(StorageInMemoryMetadata && other) = default; /// NOLINT /// NOTE: Thread unsafe part. You should not modify same StorageInMemoryMetadata /// structure from different threads. It should be used as MultiVersion From e562d97ff59739da3ca3650a33644bf9700becd7 Mon Sep 17 00:00:00 2001 From: Nikolay Yankin <211292+kolya7k@users.noreply.github.com> Date: Mon, 11 Mar 2024 14:07:19 +0300 Subject: [PATCH 282/985] Update install.md https://packages.clickhouse.com/tgz/stable/ is multi-paged now and sorted by date asc so we can't get very last version --- docs/en/getting-started/install.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/en/getting-started/install.md b/docs/en/getting-started/install.md index 234420de374..3b01434ecc5 100644 --- a/docs/en/getting-started/install.md +++ b/docs/en/getting-started/install.md @@ -262,7 +262,7 @@ The required version can be downloaded with `curl` or `wget` from repository htt After that downloaded archives should be unpacked and installed with installation scripts. Example for the latest stable version: ``` bash -LATEST_VERSION=$(curl -s https://packages.clickhouse.com/tgz/stable/ | \ +LATEST_VERSION=$(curl -s -L https://api.github.com/repos/ClickHouse/ClickHouse/tags | \ grep -Eo '[0-9]+\.[0-9]+\.[0-9]+\.[0-9]+' | sort -V -r | head -n 1) export LATEST_VERSION From 90b27432a26c0a5204e09ff5ff5f2ae8df3055af Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Mon, 11 Mar 2024 12:18:58 +0100 Subject: [PATCH 283/985] Update test.py --- tests/integration/test_backup_restore_s3/test.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/integration/test_backup_restore_s3/test.py b/tests/integration/test_backup_restore_s3/test.py index 452a9143067..f3f4837c317 100644 --- a/tests/integration/test_backup_restore_s3/test.py +++ b/tests/integration/test_backup_restore_s3/test.py @@ -130,7 +130,7 @@ def check_system_tables(backup_query_id=None): if disk ] expected_disks = ( - ("default", "local", "", ""), + ("default", "local", "None", "None"), ("disk_s3", "object_storage", "s3", "local"), ("disk_s3_cache", "object_storage", "s3", "local"), ("disk_s3_other_bucket", "object_storage", "s3", "local"), From 57f6263f67dd91e624003199295c840a228947a0 Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 11 Mar 2024 12:31:40 +0100 Subject: [PATCH 284/985] Lock contention fix --- src/Common/ProfileEvents.cpp | 1 + src/Interpreters/Cache/FileCache.cpp | 12 +++++++++--- src/Interpreters/Cache/FileCache.h | 2 +- src/Interpreters/Cache/FileCache_fwd.h | 1 + src/Interpreters/Cache/Guards.h | 15 ++++++++++++--- 5 files changed, 24 insertions(+), 7 deletions(-) diff --git a/src/Common/ProfileEvents.cpp b/src/Common/ProfileEvents.cpp index c1ac3d08245..ab1a16a3edf 100644 --- a/src/Common/ProfileEvents.cpp +++ b/src/Common/ProfileEvents.cpp @@ -476,6 +476,7 @@ The server successfully detected this situation and will download merged part fr M(FileSegmentRemoveMicroseconds, "File segment remove() time") \ M(FileSegmentHolderCompleteMicroseconds, "File segments holder complete() time") \ M(FileSegmentFailToIncreasePriority, "Number of times the priority was not 
increased due to a high contention on the cache lock") \ + M(FilesystemCacheFailToReserveSpaceBecauseOfLockContention, "Number of times space reservation was skipped due to a high contention on the cache lock") \ M(FilesystemCacheHoldFileSegments, "Filesystem cache file segments count, which were hold") \ M(FilesystemCacheUnusedHoldFileSegments, "Filesystem cache file segments count, which were hold, but not used (because of seek or LIMIT n, etc)") \ \ diff --git a/src/Interpreters/Cache/FileCache.cpp b/src/Interpreters/Cache/FileCache.cpp index 9c705ddc27c..5650b9ce44e 100644 --- a/src/Interpreters/Cache/FileCache.cpp +++ b/src/Interpreters/Cache/FileCache.cpp @@ -27,6 +27,7 @@ namespace ProfileEvents extern const Event FilesystemCacheReserveMicroseconds; extern const Event FilesystemCacheGetOrSetMicroseconds; extern const Event FilesystemCacheGetMicroseconds; + extern const Event FilesystemCacheFailToReserveSpaceBecauseOfLockContention; } namespace DB @@ -188,9 +189,9 @@ CacheGuard::Lock FileCache::lockCache() const return cache_guard.lock(); } -CacheGuard::Lock FileCache::tryLockCache() const +CacheGuard::Lock FileCache::tryLockCache(std::optional acquire_timeout) const { - return cache_guard.tryLock(); + return acquire_timeout.has_value() ? cache_guard.tryLockFor(acquire_timeout.value()) : cache_guard.tryLock(); } FileSegments FileCache::getImpl(const LockedKey & locked_key, const FileSegment::Range & range, size_t file_segments_limit) const @@ -781,7 +782,12 @@ bool FileCache::tryReserve( ProfileEventTimeIncrement watch(ProfileEvents::FilesystemCacheReserveMicroseconds); assertInitialized(); - auto cache_lock = lockCache(); + auto cache_lock = tryLockCache(std::chrono::milliseconds(FILECACHE_TRY_RESERVE_LOCK_TIMEOUT_MILLISECONDS)); + if (!cache_lock) + { + ProfileEvents::increment(ProfileEvents::FilesystemCacheFailToReserveSpaceBecauseOfLockContention); + return false; + } LOG_TEST( log, "Trying to reserve space ({} bytes) for {}:{}, current usage {}/{}", diff --git a/src/Interpreters/Cache/FileCache.h b/src/Interpreters/Cache/FileCache.h index 5b665ad0271..7434b2ac78a 100644 --- a/src/Interpreters/Cache/FileCache.h +++ b/src/Interpreters/Cache/FileCache.h @@ -173,7 +173,7 @@ public: void deactivateBackgroundOperations(); CacheGuard::Lock lockCache() const; - CacheGuard::Lock tryLockCache() const; + CacheGuard::Lock tryLockCache(std::optional acquire_timeout = std::nullopt) const; std::vector sync(); diff --git a/src/Interpreters/Cache/FileCache_fwd.h b/src/Interpreters/Cache/FileCache_fwd.h index 06261b19db7..eaed279e7fd 100644 --- a/src/Interpreters/Cache/FileCache_fwd.h +++ b/src/Interpreters/Cache/FileCache_fwd.h @@ -12,6 +12,7 @@ static constexpr int FILECACHE_DEFAULT_LOAD_METADATA_THREADS = 16; static constexpr int FILECACHE_DEFAULT_MAX_ELEMENTS = 10000000; static constexpr int FILECACHE_DEFAULT_HITS_THRESHOLD = 0; static constexpr size_t FILECACHE_BYPASS_THRESHOLD = 256 * 1024 * 1024; +static constexpr size_t FILECACHE_TRY_RESERVE_LOCK_TIMEOUT_MILLISECONDS = 1000; /// 1 sec. 
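The reservation path above now takes the cache lock with a bounded wait and treats a timeout as "space not reserved" (counting `FilesystemCacheFailToReserveSpaceBecauseOfLockContention`) rather than queueing behind a contended mutex. A compressed, standalone sketch of that pattern — this is not the actual `FileCache` code, and only the 1-second budget is mirrored from the constant above:

```cpp
#include <chrono>
#include <mutex>

std::timed_mutex cache_mutex;

bool tryReserveSketch()
{
    // Attempt the lock for at most ~1 second; this unique_lock constructor
    // calls try_lock_for() instead of blocking indefinitely.
    std::unique_lock<std::timed_mutex> lock(cache_mutex, std::chrono::milliseconds(1000));

    if (!lock.owns_lock())
        return false; // high contention: skip reservation, let the caller fall back

    // ... eviction / reservation work that requires the cache lock ...
    return true;
}
```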
class FileCache; using FileCachePtr = std::shared_ptr; diff --git a/src/Interpreters/Cache/Guards.h b/src/Interpreters/Cache/Guards.h index 5729620d82f..0ac7cb80483 100644 --- a/src/Interpreters/Cache/Guards.h +++ b/src/Interpreters/Cache/Guards.h @@ -61,17 +61,26 @@ namespace DB */ struct CacheGuard : private boost::noncopyable { + using Mutex = std::timed_mutex; /// struct is used (not keyword `using`) to make CacheGuard::Lock non-interchangable with other guards locks /// so, we wouldn't be able to pass CacheGuard::Lock to a function which accepts KeyGuard::Lock, for example - struct Lock : public std::unique_lock + struct Lock : public std::unique_lock { - using Base = std::unique_lock; + using Base = std::unique_lock; using Base::Base; }; Lock lock() { return Lock(mutex); } + Lock tryLock() { return Lock(mutex, std::try_to_lock); } - std::mutex mutex; + + Lock tryLockFor(const std::chrono::milliseconds & acquire_timeout) + { + return Lock(mutex, std::chrono::duration(acquire_timeout)); + } + +private: + Mutex mutex; }; /** From c0689f3760c738dc1f73cf58c1c9de12b4c096a7 Mon Sep 17 00:00:00 2001 From: vdimir Date: Thu, 7 Mar 2024 11:24:34 +0000 Subject: [PATCH 285/985] Fix ASTRenameQuery::clone --- src/Parsers/ASTRenameQuery.h | 1 + src/Parsers/tests/gtest_Parser.cpp | 38 ++++++++++++++++++++++++++---- 2 files changed, 35 insertions(+), 4 deletions(-) diff --git a/src/Parsers/ASTRenameQuery.h b/src/Parsers/ASTRenameQuery.h index 73d12be094a..582060ab34a 100644 --- a/src/Parsers/ASTRenameQuery.h +++ b/src/Parsers/ASTRenameQuery.h @@ -60,6 +60,7 @@ public: ASTPtr clone() const override { auto res = std::make_shared(*this); + res->cloneChildren(); cloneOutputOptions(*res); return res; } diff --git a/src/Parsers/tests/gtest_Parser.cpp b/src/Parsers/tests/gtest_Parser.cpp index 36d2deae8d7..19947cd38cc 100644 --- a/src/Parsers/tests/gtest_Parser.cpp +++ b/src/Parsers/tests/gtest_Parser.cpp @@ -9,6 +9,7 @@ #include #include #include +#include #include #include #include @@ -62,10 +63,29 @@ TEST_P(ParserTest, parseQuery) if (std::string("CREATE USER or ALTER USER query") != parser->getName() && std::string("ATTACH access entity query") != parser->getName()) { - WriteBufferFromOwnString buf; - formatAST(*ast->clone(), buf, false, false); - String formatted_ast = buf.str(); - EXPECT_EQ(expected_ast, formatted_ast); + ASTPtr ast_clone = ast->clone(); + { + WriteBufferFromOwnString buf; + formatAST(*ast_clone, buf, false, false); + String formatted_ast = buf.str(); + EXPECT_EQ(expected_ast, formatted_ast); + } + + + ASTPtr ast_clone2 = ast_clone->clone(); + /// Break `ast_clone2`, it should not affect `ast_clone` if `clone()` implemented properly + for (auto & child : ast_clone2->children) + { + if (auto * identifier = dynamic_cast(child.get())) + identifier->setShortName("new_name"); + } + + { + WriteBufferFromOwnString buf; + formatAST(*ast_clone, buf, false, false); + String formatted_ast = buf.str(); + EXPECT_EQ(expected_ast, formatted_ast); + } } else { @@ -299,6 +319,16 @@ INSTANTIATE_TEST_SUITE_P(ParserAttachUserQuery, ParserTest, } }))); +INSTANTIATE_TEST_SUITE_P(ParserRenameQuery, ParserTest, + ::testing::Combine( + ::testing::Values(std::make_shared()), + ::testing::ValuesIn(std::initializer_list{ + { + "RENAME TABLE eligible_test TO eligible_test2", + "RENAME TABLE eligible_test TO eligible_test2" + } +}))); + INSTANTIATE_TEST_SUITE_P(ParserKQLQuery, ParserKQLTest, ::testing::Combine( ::testing::Values(std::make_shared()), From 38b8e7ac7e87b0efcea7560735697de0583e0f17 Mon Sep 17 00:00:00 
2001 From: vdimir Date: Fri, 8 Mar 2024 11:54:20 +0000 Subject: [PATCH 286/985] Maintain list of ASTRenameQuery children --- src/Interpreters/AddDefaultDatabaseVisitor.h | 8 +--- src/Interpreters/InterpreterCreateQuery.cpp | 3 +- src/Interpreters/InterpreterRenameQuery.cpp | 8 ++-- .../MySQL/InterpretersMySQLDDLQuery.cpp | 25 ++++++------ src/Interpreters/SystemLog.cpp | 3 +- src/Parsers/ASTRenameQuery.h | 38 ++++++++++++++++++- src/Parsers/ParserRenameQuery.cpp | 26 ++++--------- src/Storages/StorageMaterializedView.cpp | 5 ++- 8 files changed, 69 insertions(+), 47 deletions(-) diff --git a/src/Interpreters/AddDefaultDatabaseVisitor.h b/src/Interpreters/AddDefaultDatabaseVisitor.h index b977a73d461..e36f22e8ba1 100644 --- a/src/Interpreters/AddDefaultDatabaseVisitor.h +++ b/src/Interpreters/AddDefaultDatabaseVisitor.h @@ -275,13 +275,7 @@ private: if (only_replace_current_database_function) return; - for (ASTRenameQuery::Element & elem : node.elements) - { - if (!elem.from.database) - elem.from.database = std::make_shared(database_name); - if (!elem.to.database) - elem.to.database = std::make_shared(database_name); - } + node.setDatabaseIfNotExists(database_name); } void visitDDL(ASTAlterQuery & node, ASTPtr &) const diff --git a/src/Interpreters/InterpreterCreateQuery.cpp b/src/Interpreters/InterpreterCreateQuery.cpp index d05d8b8deb1..edd7452c130 100644 --- a/src/Interpreters/InterpreterCreateQuery.cpp +++ b/src/Interpreters/InterpreterCreateQuery.cpp @@ -1612,7 +1612,6 @@ BlockIO InterpreterCreateQuery::doCreateOrReplaceTable(ASTCreateQuery & create, executeTrivialBlockIO(fill_io, getContext()); /// Replace target table with created one - auto ast_rename = std::make_shared(); ASTRenameQuery::Element elem { ASTRenameQuery::Table @@ -1627,7 +1626,7 @@ BlockIO InterpreterCreateQuery::doCreateOrReplaceTable(ASTCreateQuery & create, } }; - ast_rename->elements.push_back(std::move(elem)); + auto ast_rename = std::make_shared(ASTRenameQuery::Elements{std::move(elem)}); ast_rename->dictionary = create.is_dictionary; if (create.create_or_replace) { diff --git a/src/Interpreters/InterpreterRenameQuery.cpp b/src/Interpreters/InterpreterRenameQuery.cpp index 52001fdcaf4..06b6ebc9cbb 100644 --- a/src/Interpreters/InterpreterRenameQuery.cpp +++ b/src/Interpreters/InterpreterRenameQuery.cpp @@ -47,12 +47,12 @@ BlockIO InterpreterRenameQuery::execute() */ RenameDescriptions descriptions; - descriptions.reserve(rename.elements.size()); + descriptions.reserve(rename.getElements().size()); /// Don't allow to drop tables (that we are renaming); don't allow to create tables in places where tables will be renamed. 
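Both of these ASTRenameQuery commits enforce the same invariant: an AST node that owns child nodes must register them in `children` and deep-copy them on `clone()`, so a clone can be mutated without touching the original — exactly what the new gtest checks by renaming one clone's identifiers and re-formatting the other. A stripped-down sketch of the deep-copy half, using an invented node type rather than the real `IAST`:

```cpp
#include <memory>
#include <vector>

struct Node
{
    std::vector<std::shared_ptr<Node>> children;

    std::shared_ptr<Node> clone() const
    {
        // Copying *this copies the pointers, so both objects would still
        // share the same child nodes ...
        auto res = std::make_shared<Node>(*this);

        // ... until the children are cloned too (the role cloneChildren()
        // plays in the real code). Without this loop, editing a child of
        // one clone silently edits the other.
        for (auto & child : res->children)
            child = child->clone();

        return res;
    }
};
```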
TableGuards table_guards; - for (const auto & elem : rename.elements) + for (const auto & elem : rename.getElements()) { descriptions.emplace_back(elem, current_database); const auto & description = descriptions.back(); @@ -186,7 +186,7 @@ AccessRightsElements InterpreterRenameQuery::getRequiredAccess(InterpreterRename { AccessRightsElements required_access; const auto & rename = query_ptr->as(); - for (const auto & elem : rename.elements) + for (const auto & elem : rename.getElements()) { if (type == RenameType::RenameTable) { @@ -214,7 +214,7 @@ AccessRightsElements InterpreterRenameQuery::getRequiredAccess(InterpreterRename void InterpreterRenameQuery::extendQueryLogElemImpl(QueryLogElement & elem, const ASTPtr & ast, ContextPtr) const { const auto & rename = ast->as(); - for (const auto & element : rename.elements) + for (const auto & element : rename.getElements()) { { String database = backQuoteIfNeed(!element.from.database ? getContext()->getCurrentDatabase() : element.from.getDatabase()); diff --git a/src/Interpreters/MySQL/InterpretersMySQLDDLQuery.cpp b/src/Interpreters/MySQL/InterpretersMySQLDDLQuery.cpp index 107b435ded4..fd7ffca2872 100644 --- a/src/Interpreters/MySQL/InterpretersMySQLDDLQuery.cpp +++ b/src/Interpreters/MySQL/InterpretersMySQLDDLQuery.cpp @@ -579,7 +579,7 @@ ASTs InterpreterRenameImpl::getRewrittenQueries( const InterpreterRenameImpl::TQuery & rename_query, ContextPtr context, const String & mapped_to_database, const String & mysql_database) { ASTRenameQuery::Elements elements; - for (const auto & rename_element : rename_query.elements) + for (const auto & rename_element : rename_query.getElements()) { const auto & to_database = resolveDatabase(rename_element.to.getDatabase(), mysql_database, mapped_to_database, context); const auto & from_database = resolveDatabase(rename_element.from.getDatabase(), mysql_database, mapped_to_database, context); @@ -600,8 +600,7 @@ ASTs InterpreterRenameImpl::getRewrittenQueries( if (elements.empty()) return ASTs{}; - auto rewritten_query = std::make_shared(); - rewritten_query->elements = elements; + auto rewritten_query = std::make_shared(std::move(elements)); return ASTs{rewritten_query}; } @@ -616,7 +615,8 @@ ASTs InterpreterAlterImpl::getRewrittenQueries( return {}; auto rewritten_alter_query = std::make_shared(); - auto rewritten_rename_query = std::make_shared(); + ASTRenameQuery::Elements rename_elements; + rewritten_alter_query->setDatabase(mapped_to_database); rewritten_alter_query->setTable(alter_query.table); rewritten_alter_query->alter_object = ASTAlterQuery::AlterObjectType::TABLE; @@ -749,13 +749,13 @@ ASTs InterpreterAlterImpl::getRewrittenQueries( /// For ALTER TABLE table_name RENAME TO new_table_name_1, RENAME TO new_table_name_2; /// We just need to generate RENAME TABLE table_name TO new_table_name_2; - if (rewritten_rename_query->elements.empty()) - rewritten_rename_query->elements.push_back(ASTRenameQuery::Element()); + if (rename_elements.empty()) + rename_elements.push_back(ASTRenameQuery::Element()); - rewritten_rename_query->elements.back().from.database = std::make_shared(mapped_to_database); - rewritten_rename_query->elements.back().from.table = std::make_shared(alter_query.table); - rewritten_rename_query->elements.back().to.database = std::make_shared(mapped_to_database); - rewritten_rename_query->elements.back().to.table = std::make_shared(alter_command->new_table_name); + rename_elements.back().from.database = std::make_shared(mapped_to_database); + rename_elements.back().from.table = 
std::make_shared(alter_query.table); + rename_elements.back().to.database = std::make_shared(mapped_to_database); + rename_elements.back().to.table = std::make_shared(alter_command->new_table_name); } } @@ -765,8 +765,11 @@ ASTs InterpreterAlterImpl::getRewrittenQueries( if (!rewritten_alter_query->command_list->children.empty()) rewritten_queries.push_back(rewritten_alter_query); - if (!rewritten_rename_query->elements.empty()) + if (!rename_elements.empty()) + { + auto rewritten_rename_query = std::make_shared(std::move(rename_elements)); rewritten_queries.push_back(rewritten_rename_query); + } return rewritten_queries; } diff --git a/src/Interpreters/SystemLog.cpp b/src/Interpreters/SystemLog.cpp index 6580dc3e9b7..a74b5c67726 100644 --- a/src/Interpreters/SystemLog.cpp +++ b/src/Interpreters/SystemLog.cpp @@ -563,7 +563,6 @@ void SystemLog::prepareTable() {table_id.database_name, table_id.table_name + "_" + toString(suffix)}, getContext())) ++suffix; - auto rename = std::make_shared(); ASTRenameQuery::Element elem { ASTRenameQuery::Table @@ -586,7 +585,7 @@ void SystemLog::prepareTable() old_create_query, create_query); - rename->elements.emplace_back(std::move(elem)); + auto rename = std::make_shared(ASTRenameQuery::Elements{std::move(elem)}); ActionLock merges_lock; if (DatabaseCatalog::instance().getDatabase(table_id.database_name)->getUUID() == UUIDHelpers::Nil) diff --git a/src/Parsers/ASTRenameQuery.h b/src/Parsers/ASTRenameQuery.h index 582060ab34a..beaf93c4761 100644 --- a/src/Parsers/ASTRenameQuery.h +++ b/src/Parsers/ASTRenameQuery.h @@ -45,7 +45,6 @@ public: }; using Elements = std::vector; - Elements elements; bool exchange{false}; /// For EXCHANGE TABLES bool database{false}; /// For RENAME DATABASE @@ -54,6 +53,41 @@ public: /// Special flag for CREATE OR REPLACE. Do not throw if the second table does not exist. bool rename_if_cannot_exchange{false}; + explicit ASTRenameQuery(Elements elements_ = {}) + : elements(std::move(elements_)) + { + for (const auto & elem : elements) + { + if (elem.from.database) + children.push_back(elem.from.database); + if (elem.from.table) + children.push_back(elem.from.table); + if (elem.to.database) + children.push_back(elem.to.database); + if (elem.to.table) + children.push_back(elem.to.table); + } + } + + void setDatabaseIfNotExists(const String & database_name) + { + for (auto & elem : elements) + { + if (!elem.from.database) + { + elem.from.database = std::make_shared(database_name); + children.push_back(elem.from.database); + } + if (!elem.to.database) + { + elem.to.database = std::make_shared(database_name); + children.push_back(elem.to.database); + } + } + } + + const Elements & getElements() const { return elements; } + /** Get the text that identifies this element. 
*/ String getID(char) const override { return "Rename"; } @@ -146,6 +180,8 @@ protected: formatOnCluster(settings); } + + Elements elements; }; } diff --git a/src/Parsers/ParserRenameQuery.cpp b/src/Parsers/ParserRenameQuery.cpp index 27f2ed1cd22..f9d29108ed6 100644 --- a/src/Parsers/ParserRenameQuery.cpp +++ b/src/Parsers/ParserRenameQuery.cpp @@ -44,15 +44,14 @@ bool ParserRenameQuery::parseImpl(Pos & pos, ASTPtr & node, Expected & expected) if (!ASTQueryWithOnCluster::parse(pos, cluster_str, expected)) return false; } + ASTRenameQuery::Elements rename_elements; + rename_elements.emplace_back(); + rename_elements.back().if_exists = if_exists; + rename_elements.back().from.database = from_db; + rename_elements.back().to.database = to_db; - auto query = std::make_shared(); + auto query = std::make_shared(std::move(rename_elements)); query->database = true; - query->elements.emplace({}); - query->elements.front().if_exists = if_exists; - query->elements.front().from.database = from_db; - query->elements.front().to.database = to_db; - query->children.push_back(std::move(from_db)); - query->children.push_back(std::move(to_db)); query->cluster = cluster_str; node = query; return true; @@ -75,9 +74,8 @@ bool ParserRenameQuery::parseImpl(Pos & pos, ASTPtr & node, Expected & expected) const auto ignore_delim = [&] { return exchange ? s_and.ignore(pos) : s_to.ignore(pos); }; - auto query = std::make_shared(); - ASTRenameQuery::Elements & elements = query->elements; + ASTRenameQuery::Elements elements; while (true) { @@ -93,15 +91,6 @@ bool ParserRenameQuery::parseImpl(Pos & pos, ASTPtr & node, Expected & expected) || !ignore_delim() || !parseDatabaseAndTableAsAST(pos, expected, ref.to.database, ref.to.table)) return false; - - if (ref.from.database) - query->children.push_back(ref.from.database); - if (ref.from.table) - query->children.push_back(ref.from.table); - if (ref.to.database) - query->children.push_back(ref.to.database); - if (ref.to.table) - query->children.push_back(ref.to.table); } String cluster_str; @@ -111,6 +100,7 @@ bool ParserRenameQuery::parseImpl(Pos & pos, ASTPtr & node, Expected & expected) return false; } + auto query = std::make_shared(std::move(elements)); query->cluster = cluster_str; query->exchange = exchange; query->dictionary = dictionary; diff --git a/src/Storages/StorageMaterializedView.cpp b/src/Storages/StorageMaterializedView.cpp index 02cba1cf753..9958d65819b 100644 --- a/src/Storages/StorageMaterializedView.cpp +++ b/src/Storages/StorageMaterializedView.cpp @@ -465,8 +465,8 @@ void StorageMaterializedView::renameInMemory(const StorageID & new_table_id) if (!from_atomic_to_atomic_database && has_inner_table && tryGetTargetTable()) { auto new_target_table_name = generateInnerTableName(new_table_id); - auto rename = std::make_shared(); + ASTRenameQuery::Elements rename_elements; assert(inner_table_id.database_name == old_table_id.database_name); ASTRenameQuery::Element elem @@ -482,8 +482,9 @@ void StorageMaterializedView::renameInMemory(const StorageID & new_table_id) std::make_shared(new_target_table_name) } }; - rename->elements.emplace_back(std::move(elem)); + rename_elements.emplace_back(std::move(elem)); + auto rename = std::make_shared(std::move(rename_elements)); InterpreterRenameQuery(rename, getContext()).execute(); updateTargetTableId(new_table_id.database_name, new_target_table_name); } From 59c6311ead26e48f861e27d19d58deffe4c6d622 Mon Sep 17 00:00:00 2001 From: Max Kainov Date: Mon, 11 Mar 2024 09:55:13 +0000 Subject: [PATCH 287/985] improve report 
#do_not_test --- utils/check-style/process_style_check_result.py | 7 ++++++- 1 file changed, 6 insertions(+), 1 deletion(-) diff --git a/utils/check-style/process_style_check_result.py b/utils/check-style/process_style_check_result.py index e620d85b9d0..b043aa548d7 100755 --- a/utils/check-style/process_style_check_result.py +++ b/utils/check-style/process_style_check_result.py @@ -32,8 +32,13 @@ def process_result(result_folder): if not os.path.exists(full_path): test_results.append((f"Check {name}", "SKIPPED")) elif os.stat(full_path).st_size != 0: + with open(full_path, 'r') as file: + lines = file.readlines() + if len(lines) > 100: + lines = lines[:100] + ['====TRIMMED===='] + content = "\n".join(lines) description += f"Check {name} failed. " - test_results.append((f"Check {name}", "FAIL")) + test_results.append((f"Check {name}", "FAIL", None, content)) status = "failure" else: test_results.append((f"Check {name}", "OK")) From 8f2ff2ccd833dd1cc839922c59a90360f2b882c7 Mon Sep 17 00:00:00 2001 From: "Mikhail f. Shiryaev" Date: Mon, 11 Mar 2024 13:07:39 +0100 Subject: [PATCH 288/985] Enable black back --- tests/ci/style_check.py | 18 +++++++++--------- utils/check-style/check_py.sh | 4 ++-- .../check-style/process_style_check_result.py | 10 +++++----- 3 files changed, 16 insertions(+), 16 deletions(-) diff --git a/tests/ci/style_check.py b/tests/ci/style_check.py index 9f113b6e6f9..7fb5d22a3ce 100644 --- a/tests/ci/style_check.py +++ b/tests/ci/style_check.py @@ -1,12 +1,12 @@ #!/usr/bin/env python3 import argparse -from concurrent.futures import ProcessPoolExecutor import csv import logging import os import shutil import subprocess import sys +from concurrent.futures import ProcessPoolExecutor from pathlib import Path from typing import List, Tuple @@ -121,7 +121,7 @@ def checkout_last_ref(pr_info: PRInfo) -> None: def main(): logging.basicConfig(level=logging.INFO) logging.getLogger("git_helper").setLevel(logging.DEBUG) - # args = parse_args() + args = parse_args() stopwatch = Stopwatch() @@ -141,12 +141,14 @@ def main(): f"--entrypoint= -w/ClickHouse/utils/check-style " f"{image} ./check_cpp.sh" ) + cmd_py = ( f"docker run -u $(id -u ${{USER}}):$(id -g ${{USER}}) --cap-add=SYS_PTRACE " f"--volume={repo_path}:/ClickHouse --volume={temp_path}:/test_output " f"--entrypoint= -w/ClickHouse/utils/check-style " f"{image} ./check_py.sh" ) + cmd_docs = ( f"docker run -u $(id -u ${{USER}}):$(id -g ${{USER}}) --cap-add=SYS_PTRACE " f"--volume={repo_path}:/ClickHouse --volume={temp_path}:/test_output " @@ -175,12 +177,14 @@ def main(): _ = future1.result() if run_pycheck: + if args.push: + checkout_head(pr_info) logging.info("Run py files check: %s", cmd_py) future2 = executor.submit(subprocess.run, cmd_py, shell=True) _ = future2.result() - - # if args.push: - # checkout_head(pr_info) + if args.push: + commit_push_staged(pr_info) + checkout_last_ref(pr_info) subprocess.check_call( f"python3 ../../utils/check-style/process_style_check_result.py --in-results-dir {temp_path} " @@ -189,10 +193,6 @@ def main(): shell=True, ) - # if args.push: - # commit_push_staged(pr_info) - # checkout_last_ref(pr_info) - state, description, test_results, additional_files = process_result(temp_path) JobReport( diff --git a/utils/check-style/check_py.sh b/utils/check-style/check_py.sh index b729cd78124..13f4e754ed3 100755 --- a/utils/check-style/check_py.sh +++ b/utils/check-style/check_py.sh @@ -5,8 +5,8 @@ cd /ClickHouse/utils/check-style || echo -e "failure\tRepo not found" > /test_ou start_total=`date +%s` # 
FIXME: 1 min to wait + head checkout -# echo "Check python formatting with black" | ts -# ./check-black -n |& tee /test_output/black_output.txt +echo "Check python formatting with black" | ts +./check-black -n |& tee /test_output/black_output.txt start=`date +%s` ./check-pylint -n |& tee /test_output/pylint_output.txt diff --git a/utils/check-style/process_style_check_result.py b/utils/check-style/process_style_check_result.py index b043aa548d7..8c9837b4fc6 100755 --- a/utils/check-style/process_style_check_result.py +++ b/utils/check-style/process_style_check_result.py @@ -1,9 +1,9 @@ #!/usr/bin/env python3 -import os -import logging import argparse import csv +import logging +import os # TODO: add typing and log files to the fourth column, think about launching @@ -17,7 +17,7 @@ def process_result(result_folder): # "shellcheck", "style", "pylint", - # "black", + "black", "mypy", "typos", "whitespaces", @@ -32,10 +32,10 @@ def process_result(result_folder): if not os.path.exists(full_path): test_results.append((f"Check {name}", "SKIPPED")) elif os.stat(full_path).st_size != 0: - with open(full_path, 'r') as file: + with open(full_path, "r") as file: lines = file.readlines() if len(lines) > 100: - lines = lines[:100] + ['====TRIMMED===='] + lines = lines[:100] + ["====TRIMMED===="] content = "\n".join(lines) description += f"Check {name} failed. " test_results.append((f"Check {name}", "FAIL", None, content)) From 1ea68265b50a8c8ded253e392181b3b81df72815 Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Mon, 11 Mar 2024 12:46:30 +0000 Subject: [PATCH 289/985] Revert "Adds makeDateTime64 function." This reverts commit bd194aab41401492c5d628269df53e68243a1211. --- .../functions/date-time-functions.md | 137 ++++-------------- .../functions/other-functions.md | 65 +-------- 2 files changed, 32 insertions(+), 170 deletions(-) diff --git a/docs/en/sql-reference/functions/date-time-functions.md b/docs/en/sql-reference/functions/date-time-functions.md index 12f0c996ce7..41503abfa2f 100644 --- a/docs/en/sql-reference/functions/date-time-functions.md +++ b/docs/en/sql-reference/functions/date-time-functions.md @@ -26,115 +26,66 @@ SELECT ## makeDate -Creates a [Date](../../sql-reference/data-types/date.md) from either one of the following sets of arguments: +Creates a [Date](../../sql-reference/data-types/date.md) +- from a year, month and day argument, or +- from a year and day of year argument. -- a year, month, and day. -- a year and day of year. +**Syntax** -### Syntax - -Using a year, month, and day: - -```sql -makeDate(year, month, day) +``` sql +makeDate(year, month, day); +makeDate(year, day_of_year); ``` -Using a year and day of year: +Alias: +- `MAKEDATE(year, month, day);` +- `MAKEDATE(year, day_of_year);` -```sql -makeDate(year, day_of_year) -``` - -### Arguments +**Arguments** - `year` — Year. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). - `month` — Month. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). - `day` — Day. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). - `day_of_year` — Day of the year. 
[Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). -### Returned values +**Returned value** -A date created from the arguments. +- A date created from the arguments. Type: [Date](../../sql-reference/data-types/date.md). -### Examples +**Example** Create a Date from a year, month and day: -```sql +``` sql SELECT makeDate(2023, 2, 28) AS Date; ``` -```response -2023-02-28 +Result: + +``` text +┌───────date─┐ +│ 2023-02-28 │ +└────────────┘ ``` -Create a Date from a year and day of year: +Create a Date from a year and day of year argument: ``` sql SELECT makeDate(2023, 42) AS Date; ``` -```response -2023-02-11 -``` +Result: +``` text +┌───────date─┐ +│ 2023-02-11 │ +└────────────┘ +``` ## makeDate32 -Creates a date of type [Date32](../../sql-reference/data-types/date32.md) from either one of the following sets of arguments: - -- a year, month, and day. -- a year and day of year. - -### Syntax - -Using a year, month, and day: - -```sql -makeDate32(year, month, day) -``` - -Using a year and day of year: - -```sql -makeDate32(year, day_of_year) -``` - -### Arguments - -- `year` — Year. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). -- `month` — Month. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). -- `day` — Day. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). -- `day_of_year` — Day of the year. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). - -### Returned values - -A date created from the arguments. - -Type: [Date32](../../sql-reference/data-types/date32.md). - -### Examples - -Create a date from a year, month, and day: - -```sql -SELECT makeDate32(2024, 1, 1); -``` - -```response -2024-01-01 -``` - -Create a Date from a year and day of year: - -``` sql -SELECT makeDate32(2024, 100); -``` - -```response -2024-04-09 -``` +Like [makeDate](#makeDate) but produces a [Date32](../../sql-reference/data-types/date32.md). ## makeDateTime @@ -178,38 +129,12 @@ Result: ## makeDateTime64 -Create a [DateTime64](../../sql-reference/data-types/datetime64.md) data type value from its components (year, month, day, hour, minute, second, and optionally, subsecond precision). - -The DateTime64 data type stores both the date and time components in a single 64-bit integer value. The precision of the time component is configurable, allowing you to store time values with subsecond precision up to nanoseconds. +Like [makeDateTime](#makedatetime) but produces a [DateTime64](../../sql-reference/data-types/datetime64.md). **Syntax** -```sql -makeDateTime64(year, month, day, hour, minute, second[, fraction[, precision]]) -``` - -**Arguments** - -- `year` — [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). The year component (0-9999). -- `month` — Month. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). The month component (1-12). -- `day` — Day. 
[Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). The day component (1-31). -- `hour` — Hour. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). The hour component (0-23). -- `minute` — Minute. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). The minute component (0-59). -- `second` — Second. [Integer](../../sql-reference/data-types/int-uint.md), [Float](../../sql-reference/data-types/float.md) or [Decimal](../../sql-reference/data-types/decimal.md). The second component (0-59). -- `subsecond_precision` (optional) [Integer](../../sql-reference/data-types/int-uint.md): The precision of the subsecond component (0-9, where 0 means no subsecond precision, and 9 means nanosecond precision). - -**Returned value** - -A date and time element of type [DateTime64](../../sql-reference/data-types/datetime64.md) with created from the supplied arguments. - -**Example** - ``` sql -SELECT makeDateTime64(2023, 5, 15, 10, 30, 45, 779, 5); -``` - -```response -2023-05-15 10:30:45.00779 +makeDateTime64(year, month, day, hour, minute, second[, fraction[, precision[, timezone]]]) ``` ## timestamp diff --git a/docs/en/sql-reference/functions/other-functions.md b/docs/en/sql-reference/functions/other-functions.md index 10ceedad9aa..739b688a0d2 100644 --- a/docs/en/sql-reference/functions/other-functions.md +++ b/docs/en/sql-reference/functions/other-functions.md @@ -1866,7 +1866,7 @@ As you can see, `runningAccumulate` merges states for each group of rows separat ## joinGet -Allows you to extract data from a specific column in a Join table, similar to how you would access a value from a dictionary. +The function lets you extract data from the table the same way as from a [dictionary](../../sql-reference/dictionaries/index.md). Gets the data from [Join](../../engines/table-engines/special/join.md#creating-a-table) tables using the specified join key. @@ -1927,69 +1927,6 @@ Result: └──────────────────────────────────────────────────┘ ``` -## joinGetOrNull - -Allows you to extract data from a specific column in a Join table, similar to how you would access a value from a dictionary. - -Gets the data from [Join](../../engines/table-engines/special/join.md#creating-a-table) tables using the specified join key. - -Only supports tables created with the `ENGINE = Join(ANY, LEFT, )` statement. - -### Syntax - -```sql -joinGet(join_storage_table_name, `value_column`, join_keys) -``` - -### Parameters - -- `join_storage_table_name` — an [identifier](../../sql-reference/syntax.md#syntax-identifiers) indicating where the search is performed. The identifier is searched in the default database (see setting `default_database` in the config file). To override the default database, use `USE db_name` or specify the database and the table through the separator `db_name.db_table` as in the example. -- `value_column` — name of the column of the table that contains required data. -- `join_keys` — list of keys. - -### Returned value - -Returns a list of values corresponded to list of keys. - -If certain does not exist in source table then `0` or `null` will be returned based on [join_use_nulls](../../operations/settings/settings.md#join_use_nulls) setting. 
- -More info about `join_use_nulls` in [Join operation](../../engines/table-engines/special/join.md). - -**Example** - -Input table: - -``` sql -CREATE DATABASE db_test -CREATE TABLE db_test.id_val(`id` UInt32, `val` UInt32) ENGINE = Join(ANY, LEFT, id) SETTINGS join_use_nulls = 1 -INSERT INTO db_test.id_val VALUES (1,11)(2,12)(4,13) -``` - -``` text -┌─id─┬─val─┐ -│ 4 │ 13 │ -│ 2 │ 12 │ -│ 1 │ 11 │ -└────┴─────┘ -``` - -Query: - -``` sql -SELECT joinGet(db_test.id_val, 'val', toUInt32(number)) from numbers(4) SETTINGS join_use_nulls = 1 -``` - -Result: - -``` text -┌─joinGet(db_test.id_val, 'val', toUInt32(number))─┐ -│ 0 │ -│ 11 │ -│ 12 │ -│ 0 │ -└──────────────────────────────────────────────────┘ -``` - ## catboostEvaluate(path_to_model, feature_1, feature_2, …, feature_n) :::note From a7350299396d5ba3f2322584195554a7d946562f Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Mon, 11 Mar 2024 12:50:54 +0000 Subject: [PATCH 290/985] Fix tests --- src/Common/DateLUTImpl.h | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Common/DateLUTImpl.h b/src/Common/DateLUTImpl.h index 4087e77d588..082127e717c 100644 --- a/src/Common/DateLUTImpl.h +++ b/src/Common/DateLUTImpl.h @@ -255,7 +255,7 @@ private: static LUTIndex toLUTIndex(ExtendedDayNum d) { - return normalizeLUTIndex(static_cast(d) + daynum_offset_epoch); + return normalizeLUTIndex(static_cast(d + daynum_offset_epoch)); /// NOLINT } LUTIndex toLUTIndex(Time t) const From 802bae9661a6f22a8c42a6f88f9816e3497d9355 Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Mon, 11 Mar 2024 12:54:34 +0000 Subject: [PATCH 291/985] GCC --> clang pragmas --- base/base/coverage.cpp | 2 +- base/base/sort.h | 6 +++--- programs/client/Client.cpp | 4 ++-- programs/copier/ClusterCopierApp.cpp | 4 ++-- programs/extract-from-config/ExtractFromConfig.cpp | 4 ++-- programs/format/Format.cpp | 4 ++-- programs/local/LocalServer.cpp | 4 ++-- programs/obfuscator/Obfuscator.cpp | 4 ++-- src/Common/SSH/Wrappers.cpp | 8 ++++---- src/Functions/GatherUtils/Sources.h | 8 ++++---- 10 files changed, 24 insertions(+), 24 deletions(-) diff --git a/base/base/coverage.cpp b/base/base/coverage.cpp index 99b897c4571..d96b3ea1e9a 100644 --- a/base/base/coverage.cpp +++ b/base/base/coverage.cpp @@ -1,7 +1,7 @@ #include "coverage.h" #include -#pragma GCC diagnostic ignored "-Wreserved-identifier" +#pragma clang diagnostic ignored "-Wreserved-identifier" /// WITH_COVERAGE enables the default implementation of code coverage, diff --git a/base/base/sort.h b/base/base/sort.h index 99bf8a0830e..e46c388d185 100644 --- a/base/base/sort.h +++ b/base/base/sort.h @@ -59,8 +59,8 @@ using ComparatorWrapper = Comparator; #endif -#pragma GCC diagnostic push -#pragma GCC diagnostic ignored "-Wold-style-cast" +#pragma clang diagnostic push +#pragma clang diagnostic ignored "-Wold-style-cast" #include @@ -115,7 +115,7 @@ void partial_sort(RandomIt first, RandomIt middle, RandomIt last) ::partial_sort(first, middle, last, comparator()); } -#pragma GCC diagnostic pop +#pragma clang diagnostic pop template void sort(RandomIt first, RandomIt last, Compare compare) diff --git a/programs/client/Client.cpp b/programs/client/Client.cpp index a2bd6b6016a..1c7e57dac76 100644 --- a/programs/client/Client.cpp +++ b/programs/client/Client.cpp @@ -1377,8 +1377,8 @@ void Client::readArguments( } -#pragma GCC diagnostic ignored "-Wunused-function" -#pragma GCC diagnostic ignored "-Wmissing-declarations" +#pragma clang diagnostic ignored "-Wunused-function" +#pragma clang diagnostic ignored 
"-Wmissing-declarations" int mainEntryClickHouseClient(int argc, char ** argv) { diff --git a/programs/copier/ClusterCopierApp.cpp b/programs/copier/ClusterCopierApp.cpp index fdf07dec61a..ed748a17a55 100644 --- a/programs/copier/ClusterCopierApp.cpp +++ b/programs/copier/ClusterCopierApp.cpp @@ -232,8 +232,8 @@ int ClusterCopierApp::main(const std::vector &) } -#pragma GCC diagnostic ignored "-Wunused-function" -#pragma GCC diagnostic ignored "-Wmissing-declarations" +#pragma clang diagnostic ignored "-Wunused-function" +#pragma clang diagnostic ignored "-Wmissing-declarations" int mainEntryClickHouseClusterCopier(int argc, char ** argv) { diff --git a/programs/extract-from-config/ExtractFromConfig.cpp b/programs/extract-from-config/ExtractFromConfig.cpp index 56041ee382f..61d451664e3 100644 --- a/programs/extract-from-config/ExtractFromConfig.cpp +++ b/programs/extract-from-config/ExtractFromConfig.cpp @@ -109,8 +109,8 @@ static std::vector extractFromConfig( return {configuration->getString(key)}; } -#pragma GCC diagnostic ignored "-Wunused-function" -#pragma GCC diagnostic ignored "-Wmissing-declarations" +#pragma clang diagnostic ignored "-Wunused-function" +#pragma clang diagnostic ignored "-Wmissing-declarations" int mainEntryClickHouseExtractFromConfig(int argc, char ** argv) { diff --git a/programs/format/Format.cpp b/programs/format/Format.cpp index a1c51565ae3..c92106e2f90 100644 --- a/programs/format/Format.cpp +++ b/programs/format/Format.cpp @@ -70,8 +70,8 @@ void skipSpacesAndComments(const char*& pos, const char* end, bool print_comment } -#pragma GCC diagnostic ignored "-Wunused-function" -#pragma GCC diagnostic ignored "-Wmissing-declarations" +#pragma clang diagnostic ignored "-Wunused-function" +#pragma clang diagnostic ignored "-Wmissing-declarations" extern const char * auto_time_zones[]; diff --git a/programs/local/LocalServer.cpp b/programs/local/LocalServer.cpp index 68f0e52ce08..99639d5e604 100644 --- a/programs/local/LocalServer.cpp +++ b/programs/local/LocalServer.cpp @@ -944,8 +944,8 @@ void LocalServer::readArguments(int argc, char ** argv, Arguments & common_argum } -#pragma GCC diagnostic ignored "-Wunused-function" -#pragma GCC diagnostic ignored "-Wmissing-declarations" +#pragma clang diagnostic ignored "-Wunused-function" +#pragma clang diagnostic ignored "-Wmissing-declarations" int mainEntryClickHouseLocal(int argc, char ** argv) { diff --git a/programs/obfuscator/Obfuscator.cpp b/programs/obfuscator/Obfuscator.cpp index 242e995e466..317d93aaf0c 100644 --- a/programs/obfuscator/Obfuscator.cpp +++ b/programs/obfuscator/Obfuscator.cpp @@ -1204,8 +1204,8 @@ public: } -#pragma GCC diagnostic ignored "-Wunused-function" -#pragma GCC diagnostic ignored "-Wmissing-declarations" +#pragma clang diagnostic ignored "-Wunused-function" +#clang GCC diagnostic ignored "-Wmissing-declarations" int mainEntryClickHouseObfuscator(int argc, char ** argv) try diff --git a/src/Common/SSH/Wrappers.cpp b/src/Common/SSH/Wrappers.cpp index 463338dbe3f..a9b9f758c6e 100644 --- a/src/Common/SSH/Wrappers.cpp +++ b/src/Common/SSH/Wrappers.cpp @@ -2,13 +2,13 @@ # if USE_SSH # include -# pragma GCC diagnostic push -# pragma GCC diagnostic ignored "-Wreserved-macro-identifier" -# pragma GCC diagnostic ignored "-Wreserved-identifier" +# pragma clang diagnostic push +# pragma clang diagnostic ignored "-Wreserved-macro-identifier" +# pragma clang diagnostic ignored "-Wreserved-identifier" # include -# pragma GCC diagnostic pop +# pragma clang diagnostic pop namespace { diff --git 
a/src/Functions/GatherUtils/Sources.h b/src/Functions/GatherUtils/Sources.h index 222f9f19168..80fb9ce3900 100644 --- a/src/Functions/GatherUtils/Sources.h +++ b/src/Functions/GatherUtils/Sources.h @@ -140,9 +140,9 @@ struct NumericArraySource : public ArraySourceImpl> /// The methods can be virtual or not depending on the template parameter. See IStringSource. -#pragma GCC diagnostic push -#pragma GCC diagnostic ignored "-Wsuggest-override" -#pragma GCC diagnostic ignored "-Wsuggest-destructor-override" +#pragma clang diagnostic push +#pragma clang diagnostic ignored "-Wsuggest-override" +#pragma clang diagnostic ignored "-Wsuggest-destructor-override" template struct ConstSource : public Base @@ -231,7 +231,7 @@ struct ConstSource : public Base } }; -#pragma GCC diagnostic pop +#pragma clang diagnostic pop struct StringSource { From a7568ddbfaf107e9dafa6fa83c9d5f747a0e7153 Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Mon, 11 Mar 2024 12:58:20 +0000 Subject: [PATCH 292/985] Fix spelling --- utils/check-style/aspell-ignore/en/aspell-dict.txt | 3 +++ 1 file changed, 3 insertions(+) diff --git a/utils/check-style/aspell-ignore/en/aspell-dict.txt b/utils/check-style/aspell-ignore/en/aspell-dict.txt index 3614bcb7452..473907b45ae 100644 --- a/utils/check-style/aspell-ignore/en/aspell-dict.txt +++ b/utils/check-style/aspell-ignore/en/aspell-dict.txt @@ -1846,6 +1846,7 @@ linearized lineasstring linefeeds lineorder +linestring linux llvm loadDefaultCAFile @@ -2204,7 +2205,9 @@ rankCorr rapidjson rawblob readWKTMultiPolygon +readWKTPoint readWKTPolygon +readWKTRing readahead readline readme From c4f29af8ec0927c09b9d12d83767607020915c30 Mon Sep 17 00:00:00 2001 From: Max Kainov Date: Mon, 11 Mar 2024 13:35:05 +0000 Subject: [PATCH 293/985] CI: fix nightly job issue #do_not_test --- tests/ci/ci.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/tests/ci/ci.py b/tests/ci/ci.py index 1eec9a6771b..9d57f161be3 100644 --- a/tests/ci/ci.py +++ b/tests/ci/ci.py @@ -1756,7 +1756,8 @@ def main() -> int: result["build"] = build_digest result["docs"] = docs_digest result["ci_flags"] = ci_flags - result["stages_data"] = _generate_ci_stage_config(jobs_data) + if not args.skip_jobs: + result["stages_data"] = _generate_ci_stage_config(jobs_data) result["jobs_data"] = jobs_data result["docker_data"] = docker_data ### CONFIGURE action: end From 19d8256fa83a4e8353dcad372067085ec8f0828d Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Mon, 11 Mar 2024 14:44:19 +0100 Subject: [PATCH 294/985] Update test.py --- tests/integration/test_backup_restore_s3/test.py | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/tests/integration/test_backup_restore_s3/test.py b/tests/integration/test_backup_restore_s3/test.py index f3f4837c317..d65fc1f09d6 100644 --- a/tests/integration/test_backup_restore_s3/test.py +++ b/tests/integration/test_backup_restore_s3/test.py @@ -130,11 +130,11 @@ def check_system_tables(backup_query_id=None): if disk ] expected_disks = ( - ("default", "local", "None", "None"), - ("disk_s3", "object_storage", "s3", "local"), - ("disk_s3_cache", "object_storage", "s3", "local"), - ("disk_s3_other_bucket", "object_storage", "s3", "local"), - ("disk_s3_plain", "object_storage", "s3", "plain"), + ("default", "Local", "None", "None"), + ("disk_s3", "ObjectStorage", "S3", "Local"), + ("disk_s3_cache", "ObjectStorage", "S3", "Local"), + ("disk_s3_other_bucket", "ObjectStorage", "S3", "Local"), + ("disk_s3_plain", 
"ObjectStorage", "S3", "Plain"), ) assert len(expected_disks) == len(disks) for expected_disk in expected_disks: From 9bada70f45654495a30e394d94a374a862c24fb5 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Ra=C3=BAl=20Mar=C3=ADn?= Date: Mon, 11 Mar 2024 14:52:32 +0100 Subject: [PATCH 295/985] Remove a bunch of transitive dependencies --- src/Backups/BackupCoordinationRemote.cpp | 2 ++ src/Formats/ReadSchemaUtils.cpp | 9 +++++---- src/Interpreters/DatabaseCatalog.h | 7 +++---- src/Interpreters/GraceHashJoin.cpp | 15 ++++++--------- src/Interpreters/TemporaryDataOnDisk.h | 6 +++--- src/Planner/PlannerExpressionAnalysis.cpp | 2 ++ src/Processors/QueryPlan/AggregatingStep.cpp | 1 + src/Processors/QueryPlan/CubeStep.cpp | 7 ++++--- src/Processors/QueryPlan/SortingStep.cpp | 1 + 9 files changed, 27 insertions(+), 23 deletions(-) diff --git a/src/Backups/BackupCoordinationRemote.cpp b/src/Backups/BackupCoordinationRemote.cpp index 9c509858b2a..ec652f20069 100644 --- a/src/Backups/BackupCoordinationRemote.cpp +++ b/src/Backups/BackupCoordinationRemote.cpp @@ -14,6 +14,8 @@ #include #include +#include + namespace DB { diff --git a/src/Formats/ReadSchemaUtils.cpp b/src/Formats/ReadSchemaUtils.cpp index 5badf4301bf..b05b768899b 100644 --- a/src/Formats/ReadSchemaUtils.cpp +++ b/src/Formats/ReadSchemaUtils.cpp @@ -1,10 +1,11 @@ #include -#include -#include -#include -#include #include #include +#include +#include +#include +#include +#include namespace DB { diff --git a/src/Interpreters/DatabaseCatalog.h b/src/Interpreters/DatabaseCatalog.h index 4fe114cc493..6f05a3cea0f 100644 --- a/src/Interpreters/DatabaseCatalog.h +++ b/src/Interpreters/DatabaseCatalog.h @@ -1,15 +1,14 @@ #pragma once #include +#include +#include #include #include -#include #include #include -#include "Common/NamePrompter.h" +#include #include -#include "Storages/IStorage.h" -#include "Databases/IDatabase.h" #include #include diff --git a/src/Interpreters/GraceHashJoin.cpp b/src/Interpreters/GraceHashJoin.cpp index 5fb92a68a29..53d1f48c291 100644 --- a/src/Interpreters/GraceHashJoin.cpp +++ b/src/Interpreters/GraceHashJoin.cpp @@ -1,21 +1,18 @@ +#include +#include +#include +#include #include #include #include - -#include #include - -#include +#include #include #include #include -#include -#include - -#include - #include +#include namespace CurrentMetrics diff --git a/src/Interpreters/TemporaryDataOnDisk.h b/src/Interpreters/TemporaryDataOnDisk.h index e57d9130369..8b0649be1b1 100644 --- a/src/Interpreters/TemporaryDataOnDisk.h +++ b/src/Interpreters/TemporaryDataOnDisk.h @@ -2,11 +2,11 @@ #include -#include -#include +#include #include -#include +#include #include +#include namespace CurrentMetrics diff --git a/src/Planner/PlannerExpressionAnalysis.cpp b/src/Planner/PlannerExpressionAnalysis.cpp index 52001eb27c5..30d90a68072 100644 --- a/src/Planner/PlannerExpressionAnalysis.cpp +++ b/src/Planner/PlannerExpressionAnalysis.cpp @@ -3,6 +3,8 @@ #include #include +#include + #include #include #include diff --git a/src/Processors/QueryPlan/AggregatingStep.cpp b/src/Processors/QueryPlan/AggregatingStep.cpp index f374a7b7b10..a76bacdd97b 100644 --- a/src/Processors/QueryPlan/AggregatingStep.cpp +++ b/src/Processors/QueryPlan/AggregatingStep.cpp @@ -8,6 +8,7 @@ #include #include #include +#include #include #include #include diff --git a/src/Processors/QueryPlan/CubeStep.cpp b/src/Processors/QueryPlan/CubeStep.cpp index 0c632c346c7..d010a3327a6 100644 --- a/src/Processors/QueryPlan/CubeStep.cpp +++ b/src/Processors/QueryPlan/CubeStep.cpp @@ 
-1,10 +1,11 @@ +#include +#include +#include +#include #include #include #include -#include #include -#include -#include namespace DB { diff --git a/src/Processors/QueryPlan/SortingStep.cpp b/src/Processors/QueryPlan/SortingStep.cpp index 641b9036d4c..d0491cb4b82 100644 --- a/src/Processors/QueryPlan/SortingStep.cpp +++ b/src/Processors/QueryPlan/SortingStep.cpp @@ -1,6 +1,7 @@ #include #include #include +#include #include #include #include From 91de3825171eefb8f828c2907181b6a5e6b0f017 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?J=C3=A1nos=20Benjamin=20Antal?= Date: Mon, 11 Mar 2024 14:00:01 +0000 Subject: [PATCH 296/985] Spit `DictionaryPipelineExecutor` into separate file --- src/Dictionaries/CacheDictionary.cpp | 2 +- .../DictionaryPipelineExecutor.cpp | 42 +++++++++++++++++++ src/Dictionaries/DictionaryPipelineExecutor.h | 27 ++++++++++++ src/Dictionaries/DictionarySourceHelpers.cpp | 29 ------------- src/Dictionaries/DictionarySourceHelpers.h | 17 -------- src/Dictionaries/FlatDictionary.cpp | 2 +- src/Dictionaries/HashedArrayDictionary.cpp | 1 + src/Dictionaries/HashedDictionary.h | 2 +- src/Dictionaries/IPAddressDictionary.cpp | 1 + src/Dictionaries/PolygonDictionary.cpp | 3 +- src/Dictionaries/RangeHashedDictionary.h | 6 +-- src/Dictionaries/RegExpTreeDictionary.cpp | 1 + .../registerRangeHashedDictionary.cpp | 5 ++- 13 files changed, 82 insertions(+), 56 deletions(-) create mode 100644 src/Dictionaries/DictionaryPipelineExecutor.cpp create mode 100644 src/Dictionaries/DictionaryPipelineExecutor.h diff --git a/src/Dictionaries/CacheDictionary.cpp b/src/Dictionaries/CacheDictionary.cpp index 8444042db9e..b136d5ebd71 100644 --- a/src/Dictionaries/CacheDictionary.cpp +++ b/src/Dictionaries/CacheDictionary.cpp @@ -9,7 +9,7 @@ #include #include -#include +#include #include #include diff --git a/src/Dictionaries/DictionaryPipelineExecutor.cpp b/src/Dictionaries/DictionaryPipelineExecutor.cpp new file mode 100644 index 00000000000..30d1ab95f53 --- /dev/null +++ b/src/Dictionaries/DictionaryPipelineExecutor.cpp @@ -0,0 +1,42 @@ +#include + +#include +#include +#include +#include + +namespace DB +{ + +namespace ErrorCodes +{ +extern const int LOGICAL_ERROR; +} + +DictionaryPipelineExecutor::DictionaryPipelineExecutor(QueryPipeline & pipeline_, bool async) + : async_executor(async ? std::make_unique(pipeline_) : nullptr) + , executor(async ? 
nullptr : std::make_unique(pipeline_)) +{ +} + +bool DictionaryPipelineExecutor::pull(Block & block) +{ + if (async_executor) + { + while (true) + { + bool has_data = async_executor->pull(block); + if (has_data && !block) + continue; + return has_data; + } + } + else if (executor) + return executor->pull(block); + else + throw Exception(ErrorCodes::LOGICAL_ERROR, "DictionaryPipelineExecutor is not initialized"); +} + +DictionaryPipelineExecutor::~DictionaryPipelineExecutor() = default; + +} diff --git a/src/Dictionaries/DictionaryPipelineExecutor.h b/src/Dictionaries/DictionaryPipelineExecutor.h new file mode 100644 index 00000000000..601213e5039 --- /dev/null +++ b/src/Dictionaries/DictionaryPipelineExecutor.h @@ -0,0 +1,27 @@ +#pragma once + +#include + +namespace DB +{ + +class Block; +class QueryPipeline; +class PullingAsyncPipelineExecutor; +class PullingPipelineExecutor; + +/// Wrapper for `Pulling(Async)PipelineExecutor` to dynamically dispatch calls to the right executor +class DictionaryPipelineExecutor +{ +public: + DictionaryPipelineExecutor(QueryPipeline & pipeline_, bool async); + bool pull(Block & block); + + ~DictionaryPipelineExecutor(); + +private: + std::unique_ptr async_executor; + std::unique_ptr executor; +}; + +} diff --git a/src/Dictionaries/DictionarySourceHelpers.cpp b/src/Dictionaries/DictionarySourceHelpers.cpp index d9a4d9ccbcf..f0e1bc4109a 100644 --- a/src/Dictionaries/DictionarySourceHelpers.cpp +++ b/src/Dictionaries/DictionarySourceHelpers.cpp @@ -9,15 +9,11 @@ #include #include -#include -#include - namespace DB { namespace ErrorCodes { - extern const int LOGICAL_ERROR; extern const int SIZES_OF_COLUMNS_DOESNT_MATCH; } @@ -135,29 +131,4 @@ String TransformWithAdditionalColumns::getName() const return "TransformWithAdditionalColumns"; } -DictionaryPipelineExecutor::DictionaryPipelineExecutor(QueryPipeline & pipeline_, bool async) - : async_executor(async ? std::make_unique(pipeline_) : nullptr) - , executor(async ? 
nullptr : std::make_unique(pipeline_)) -{} - -bool DictionaryPipelineExecutor::pull(Block & block) -{ - if (async_executor) - { - while (true) - { - bool has_data = async_executor->pull(block); - if (has_data && !block) - continue; - return has_data; - } - } - else if (executor) - return executor->pull(block); - else - throw Exception(ErrorCodes::LOGICAL_ERROR, "DictionaryPipelineExecutor is not initialized"); -} - -DictionaryPipelineExecutor::~DictionaryPipelineExecutor() = default; - } diff --git a/src/Dictionaries/DictionarySourceHelpers.h b/src/Dictionaries/DictionarySourceHelpers.h index a545b5cdac7..39c6e7b3c42 100644 --- a/src/Dictionaries/DictionarySourceHelpers.h +++ b/src/Dictionaries/DictionarySourceHelpers.h @@ -16,10 +16,6 @@ namespace DB struct DictionaryStructure; class SettingsChanges; -class PullingPipelineExecutor; -class PullingAsyncPipelineExecutor; -class QueryPipeline; - /// For simple key Block blockForIds( @@ -55,17 +51,4 @@ private: size_t current_range_index = 0; }; -/// Wrapper for `Pulling(Async)PipelineExecutor` to dynamically dispatch calls to the right executor -class DictionaryPipelineExecutor -{ -public: - DictionaryPipelineExecutor(QueryPipeline & pipeline_, bool async); - bool pull(Block & block); - - ~DictionaryPipelineExecutor(); -private: - std::unique_ptr async_executor; - std::unique_ptr executor; -}; - } diff --git a/src/Dictionaries/FlatDictionary.cpp b/src/Dictionaries/FlatDictionary.cpp index efb7d0a176c..fc58ff525bd 100644 --- a/src/Dictionaries/FlatDictionary.cpp +++ b/src/Dictionaries/FlatDictionary.cpp @@ -15,7 +15,7 @@ #include #include -#include +#include #include #include diff --git a/src/Dictionaries/HashedArrayDictionary.cpp b/src/Dictionaries/HashedArrayDictionary.cpp index d09f402143e..2420c07277c 100644 --- a/src/Dictionaries/HashedArrayDictionary.cpp +++ b/src/Dictionaries/HashedArrayDictionary.cpp @@ -10,6 +10,7 @@ #include #include #include +#include #include #include diff --git a/src/Dictionaries/HashedDictionary.h b/src/Dictionaries/HashedDictionary.h index b3b8cc56868..46a0af487f5 100644 --- a/src/Dictionaries/HashedDictionary.h +++ b/src/Dictionaries/HashedDictionary.h @@ -6,7 +6,7 @@ #include #include #include -#include +#include #include #include #include diff --git a/src/Dictionaries/IPAddressDictionary.cpp b/src/Dictionaries/IPAddressDictionary.cpp index e1c9572e607..1bc6d16c932 100644 --- a/src/Dictionaries/IPAddressDictionary.cpp +++ b/src/Dictionaries/IPAddressDictionary.cpp @@ -19,6 +19,7 @@ #include #include #include +#include #include #include diff --git a/src/Dictionaries/PolygonDictionary.cpp b/src/Dictionaries/PolygonDictionary.cpp index 485b48d9d81..1456a0db750 100644 --- a/src/Dictionaries/PolygonDictionary.cpp +++ b/src/Dictionaries/PolygonDictionary.cpp @@ -1,6 +1,5 @@ #include "PolygonDictionary.h" -#include #include #include @@ -15,7 +14,7 @@ #include #include #include -#include +#include namespace DB diff --git a/src/Dictionaries/RangeHashedDictionary.h b/src/Dictionaries/RangeHashedDictionary.h index 1a6ee7e81d4..509b991b30c 100644 --- a/src/Dictionaries/RangeHashedDictionary.h +++ b/src/Dictionaries/RangeHashedDictionary.h @@ -15,6 +15,8 @@ #include #include #include +#include +#include #include #include @@ -29,10 +31,6 @@ #include #include -#include -#include -#include - namespace DB { diff --git a/src/Dictionaries/RegExpTreeDictionary.cpp b/src/Dictionaries/RegExpTreeDictionary.cpp index 4d82aa9ca0e..8930074bbe0 100644 --- a/src/Dictionaries/RegExpTreeDictionary.cpp +++ 
b/src/Dictionaries/RegExpTreeDictionary.cpp @@ -27,6 +27,7 @@ #include #include #include +#include #include #include diff --git a/src/Dictionaries/registerRangeHashedDictionary.cpp b/src/Dictionaries/registerRangeHashedDictionary.cpp index 4e20abfdb79..8123b811198 100644 --- a/src/Dictionaries/registerRangeHashedDictionary.cpp +++ b/src/Dictionaries/registerRangeHashedDictionary.cpp @@ -1,5 +1,8 @@ -#include "RangeHashedDictionary.h" +#include + #include +#include +#include #include namespace DB From 8b5ccb4735365ef81af4debcc3180f296452268d Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Ra=C3=BAl=20Mar=C3=ADn?= Date: Mon, 11 Mar 2024 15:53:46 +0100 Subject: [PATCH 297/985] Remove one template --- src/Interpreters/Aggregator.cpp | 65 +++++++++++++-------------------- src/Interpreters/Aggregator.h | 4 +- 2 files changed, 28 insertions(+), 41 deletions(-) diff --git a/src/Interpreters/Aggregator.cpp b/src/Interpreters/Aggregator.cpp index 80a98683867..69625dbd57d 100644 --- a/src/Interpreters/Aggregator.cpp +++ b/src/Interpreters/Aggregator.cpp @@ -2609,8 +2609,9 @@ void NO_INLINE Aggregator::mergeDataNullKey( } } -template -void NO_INLINE Aggregator::mergeDataImpl(Table & table_dst, Table & table_src, Arena * arena) const +template +void NO_INLINE +Aggregator::mergeDataImpl(Table & table_dst, Table & table_src, Arena * arena, bool use_compiled_functions [[maybe_unused]]) const { if constexpr (Method::low_cardinality_optimization || Method::one_key_nullable_optimization) mergeDataNullKey(table_dst, table_src, arena); @@ -2637,7 +2638,7 @@ void NO_INLINE Aggregator::mergeDataImpl(Table & table_dst, Table & table_src, A table_src.clearAndShrink(); #if USE_EMBEDDED_COMPILER - if constexpr (use_compiled_functions) + if (use_compiled_functions) { const auto & compiled_functions = compiled_aggregate_functions_holder->compiled_aggregate_functions; compiled_functions.merge_aggregate_states_function(dst_places.data(), src_places.data(), dst_places.size()); @@ -2787,26 +2788,16 @@ void NO_INLINE Aggregator::mergeSingleLevelDataImpl( if (!no_more_keys) { + bool use_compiled_functions = false; #if USE_EMBEDDED_COMPILER - if (compiled_aggregate_functions_holder) - { - if (prefetch) - mergeDataImpl( - getDataVariant(*res).data, getDataVariant(current).data, res->aggregates_pool); - else - mergeDataImpl( - getDataVariant(*res).data, getDataVariant(current).data, res->aggregates_pool); - } - else + use_compiled_functions = compiled_aggregate_functions_holder != nullptr; #endif - { - if (prefetch) - mergeDataImpl( - getDataVariant(*res).data, getDataVariant(current).data, res->aggregates_pool); - else - mergeDataImpl( - getDataVariant(*res).data, getDataVariant(current).data, res->aggregates_pool); - } + if (prefetch) + mergeDataImpl( + getDataVariant(*res).data, getDataVariant(current).data, res->aggregates_pool, use_compiled_functions); + else + mergeDataImpl( + getDataVariant(*res).data, getDataVariant(current).data, res->aggregates_pool, use_compiled_functions); } else if (res->without_key) { @@ -2851,26 +2842,22 @@ void NO_INLINE Aggregator::mergeBucketImpl( return; AggregatedDataVariants & current = *data[result_num]; + bool use_compiled_functions = false; #if USE_EMBEDDED_COMPILER - if (compiled_aggregate_functions_holder) - { - if (prefetch) - mergeDataImpl( - getDataVariant(*res).data.impls[bucket], getDataVariant(current).data.impls[bucket], arena); - else - mergeDataImpl( - getDataVariant(*res).data.impls[bucket], getDataVariant(current).data.impls[bucket], arena); - } - else + use_compiled_functions = 
compiled_aggregate_functions_holder != nullptr; #endif - { - if (prefetch) - mergeDataImpl( - getDataVariant(*res).data.impls[bucket], getDataVariant(current).data.impls[bucket], arena); - else - mergeDataImpl( - getDataVariant(*res).data.impls[bucket], getDataVariant(current).data.impls[bucket], arena); - } + if (prefetch) + mergeDataImpl( + getDataVariant(*res).data.impls[bucket], + getDataVariant(current).data.impls[bucket], + arena, + use_compiled_functions); + else + mergeDataImpl( + getDataVariant(*res).data.impls[bucket], + getDataVariant(current).data.impls[bucket], + arena, + use_compiled_functions); } } diff --git a/src/Interpreters/Aggregator.h b/src/Interpreters/Aggregator.h index 375b8986101..67e82cdd784 100644 --- a/src/Interpreters/Aggregator.h +++ b/src/Interpreters/Aggregator.h @@ -1429,8 +1429,8 @@ private: Arena * arena) const; /// Merge data from hash table `src` into `dst`. - template - void mergeDataImpl(Table & table_dst, Table & table_src, Arena * arena) const; + template + void mergeDataImpl(Table & table_dst, Table & table_src, Arena * arena, bool use_compiled_functions) const; /// Merge data from hash table `src` into `dst`, but only for keys that already exist in dst. In other cases, merge the data into `overflows`. template From 724cc903afb9283a8369a62a836d04eceae42e57 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Mon, 11 Mar 2024 15:56:02 +0100 Subject: [PATCH 298/985] Restart CI --- tests/queries/0_stateless/03001_parallel_parsing_deadlock.sh | 1 - 1 file changed, 1 deletion(-) diff --git a/tests/queries/0_stateless/03001_parallel_parsing_deadlock.sh b/tests/queries/0_stateless/03001_parallel_parsing_deadlock.sh index 1bf21dfc53b..6cd5c3b486c 100755 --- a/tests/queries/0_stateless/03001_parallel_parsing_deadlock.sh +++ b/tests/queries/0_stateless/03001_parallel_parsing_deadlock.sh @@ -9,4 +9,3 @@ DATA_FILE=$CLICKHOUSE_TEST_UNIQUE_NAME.csv $CLICKHOUSE_LOCAL -q "select number > 1000000 ? 
'error' : toString(number) from numbers(2000000) format CSV" > $DATA_FILE $CLICKHOUSE_LOCAL -q "select * from file($DATA_FILE, CSV, 'x UInt64') format Null settings input_format_allow_errors_ratio=1" rm $DATA_FILE - From ecc30448baa1c6283f3f0f13c83cfd1bf4428b9b Mon Sep 17 00:00:00 2001 From: avogar Date: Mon, 11 Mar 2024 15:26:29 +0000 Subject: [PATCH 299/985] Fix filtering when optimize_use_implicit_projections=1 --- .../optimizeUseAggregateProjection.cpp | 4 ++ src/Storages/VirtualColumnUtils.cpp | 2 +- src/Storages/VirtualColumnUtils.h | 3 + ...ions_non_deterministoc_functions.reference | 55 +++++++++++++++++++ ...rojections_non_deterministoc_functions.sql | 28 ++++++++++ 5 files changed, 91 insertions(+), 1 deletion(-) create mode 100644 tests/queries/0_stateless/03008_filter_projections_non_deterministoc_functions.reference create mode 100644 tests/queries/0_stateless/03008_filter_projections_non_deterministoc_functions.sql diff --git a/src/Processors/QueryPlan/Optimizations/optimizeUseAggregateProjection.cpp b/src/Processors/QueryPlan/Optimizations/optimizeUseAggregateProjection.cpp index 91f4213ff43..b40fea47b3c 100644 --- a/src/Processors/QueryPlan/Optimizations/optimizeUseAggregateProjection.cpp +++ b/src/Processors/QueryPlan/Optimizations/optimizeUseAggregateProjection.cpp @@ -18,6 +18,7 @@ #include #include +#include #include #include #include @@ -464,6 +465,9 @@ AggregateProjectionCandidates getAggregateProjectionCandidates( // LOG_TRACE(getLogger("optimizeUseProjections"), "Query DAG: {}", dag.dag->dumpDAG()); candidates.has_filter = dag.filter_node; + /// We can't use minmax projection if filter has non-deterministic functions. + if (dag.filter_node && !VirtualColumnUtils::isDeterministicInScopeOfQuery(dag.filter_node)) + can_use_minmax_projection = false; if (can_use_minmax_projection) { diff --git a/src/Storages/VirtualColumnUtils.cpp b/src/Storages/VirtualColumnUtils.cpp index 897090223d6..c3ac27903c9 100644 --- a/src/Storages/VirtualColumnUtils.cpp +++ b/src/Storages/VirtualColumnUtils.cpp @@ -238,7 +238,7 @@ static bool canEvaluateSubtree(const ActionsDAG::Node * node, const Block & allo return true; } -static bool isDeterministicInScopeOfQuery(const ActionsDAG::Node * node) +bool isDeterministicInScopeOfQuery(const ActionsDAG::Node * node) { for (const auto * child : node->children) { diff --git a/src/Storages/VirtualColumnUtils.h b/src/Storages/VirtualColumnUtils.h index b5526fc5c7f..83494872cac 100644 --- a/src/Storages/VirtualColumnUtils.h +++ b/src/Storages/VirtualColumnUtils.h @@ -25,6 +25,9 @@ void filterBlockWithPredicate(const ActionsDAG::Node * predicate, Block & block, /// Just filters block. Block should contain all the required columns. void filterBlockWithDAG(ActionsDAGPtr dag, Block & block, ContextPtr context); +/// Recursively checks if all functions used in DAG are deterministic in scope of query. +bool isDeterministicInScopeOfQuery(const ActionsDAG::Node * node); + /// Extract a part of predicate that can be evaluated using only columns from input_names. 
ActionsDAGPtr splitFilterDagForAllowedInputs(const ActionsDAG::Node * predicate, const Block * allowed_inputs); diff --git a/tests/queries/0_stateless/03008_filter_projections_non_deterministoc_functions.reference b/tests/queries/0_stateless/03008_filter_projections_non_deterministoc_functions.reference new file mode 100644 index 00000000000..8233925d609 --- /dev/null +++ b/tests/queries/0_stateless/03008_filter_projections_non_deterministoc_functions.reference @@ -0,0 +1,55 @@ +-- count +100000 all_10_10_0 +100000 all_1_1_0 +100000 all_2_2_0 +100000 all_3_3_0 +100000 all_4_4_0 +100000 all_5_5_0 +100000 all_6_6_0 +100000 all_7_7_0 +100000 all_8_8_0 +100000 all_9_9_0 +-- rand()%2=0: +1 all_10_10_0 +1 all_1_1_0 +1 all_2_2_0 +1 all_3_3_0 +1 all_4_4_0 +1 all_5_5_0 +1 all_6_6_0 +1 all_7_7_0 +1 all_8_8_0 +1 all_9_9_0 +-- optimize_use_implicit_projections=0 +1 all_10_10_0 +1 all_1_1_0 +1 all_2_2_0 +1 all_3_3_0 +1 all_4_4_0 +1 all_5_5_0 +1 all_6_6_0 +1 all_7_7_0 +1 all_8_8_0 +1 all_9_9_0 +-- optimize_trivial_count_query=0 +1 all_10_10_0 +1 all_1_1_0 +1 all_2_2_0 +1 all_3_3_0 +1 all_4_4_0 +1 all_5_5_0 +1 all_6_6_0 +1 all_7_7_0 +1 all_8_8_0 +1 all_9_9_0 +-- optimize_trivial_count_query=0, optimize_use_implicit_projections=0 +1 all_10_10_0 +1 all_1_1_0 +1 all_2_2_0 +1 all_3_3_0 +1 all_4_4_0 +1 all_5_5_0 +1 all_6_6_0 +1 all_7_7_0 +1 all_8_8_0 +1 all_9_9_0 diff --git a/tests/queries/0_stateless/03008_filter_projections_non_deterministoc_functions.sql b/tests/queries/0_stateless/03008_filter_projections_non_deterministoc_functions.sql new file mode 100644 index 00000000000..3be9bc3982a --- /dev/null +++ b/tests/queries/0_stateless/03008_filter_projections_non_deterministoc_functions.sql @@ -0,0 +1,28 @@ +create table test (number UInt64) engine=MergeTree order by number; +system stop merges test; +INSERT INTO test select number from numbers(100000); +INSERT INTO test select number from numbers(100000); +INSERT INTO test select number from numbers(100000); +INSERT INTO test select number from numbers(100000); +INSERT INTO test select number from numbers(100000); +INSERT INTO test select number from numbers(100000); +INSERT INTO test select number from numbers(100000); +INSERT INTO test select number from numbers(100000); +INSERT INTO test select number from numbers(100000); +INSERT INTO test select number from numbers(100000); + +select '-- count'; +SELECT count(), _part FROM test GROUP BY _part ORDER BY _part; + +select '-- rand()%2=0:'; +SELECT count() > 0 AND count() < 100000, _part FROM test WHERE rand(1)%2=1 GROUP BY _part ORDER BY _part; + +select '-- optimize_use_implicit_projections=0'; +SELECT count() > 0 AND count() < 100000, _part FROM test WHERE rand(2)%2=1 GROUP BY _part ORDER BY _part settings optimize_use_implicit_projections=0; + +select '-- optimize_trivial_count_query=0'; +SELECT count() > 0 AND count() < 100000, _part FROM test WHERE rand(3)%2=1 GROUP BY _part ORDER BY _part settings optimize_trivial_count_query=0; + +select '-- optimize_trivial_count_query=0, optimize_use_implicit_projections=0'; +SELECT count() > 0 AND count() < 100000, _part FROM test WHERE rand(4)%2=1 GROUP BY _part ORDER BY _part settings optimize_trivial_count_query=0,optimize_use_implicit_projections=0; + From 879f7f2f8c862aae51ddc5a8faebb8d07b5d4493 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Ra=C3=BAl=20Mar=C3=ADn?= Date: Mon, 11 Mar 2024 16:28:25 +0100 Subject: [PATCH 300/985] Remove more templates for JIT --- src/Interpreters/Aggregator.cpp | 185 ++++++++++++++------------------ src/Interpreters/Aggregator.h | 
21 ++-- 2 files changed, 96 insertions(+), 110 deletions(-) diff --git a/src/Interpreters/Aggregator.cpp b/src/Interpreters/Aggregator.cpp index 69625dbd57d..c7ce3e46446 100644 --- a/src/Interpreters/Aggregator.cpp +++ b/src/Interpreters/Aggregator.cpp @@ -1111,6 +1111,7 @@ void NO_INLINE Aggregator::executeImpl( bool all_keys_are_const, AggregateDataPtr overflow_row) const { + bool use_compiled_functions = false; if (!no_more_keys) { /// Prefetching doesn't make sense for small hash tables, because they fit in caches entirely. @@ -1118,33 +1119,47 @@ void NO_INLINE Aggregator::executeImpl( && (method.data.getBufferSizeInBytes() > min_bytes_for_prefetch); #if USE_EMBEDDED_COMPILER - if (compiled_aggregate_functions_holder && !hasSparseArguments(aggregate_instructions)) - { - if (prefetch) - executeImplBatch( - method, state, aggregates_pool, row_begin, row_end, aggregate_instructions, all_keys_are_const, overflow_row); - else - executeImplBatch( - method, state, aggregates_pool, row_begin, row_end, aggregate_instructions, all_keys_are_const, overflow_row); - } - else + use_compiled_functions = compiled_aggregate_functions_holder && !hasSparseArguments(aggregate_instructions); #endif - { - if (prefetch) - executeImplBatch( - method, state, aggregates_pool, row_begin, row_end, aggregate_instructions, all_keys_are_const, overflow_row); - else - executeImplBatch( - method, state, aggregates_pool, row_begin, row_end, aggregate_instructions, all_keys_are_const, overflow_row); - } + if (prefetch) + executeImplBatch( + method, + state, + aggregates_pool, + row_begin, + row_end, + aggregate_instructions, + all_keys_are_const, + use_compiled_functions, + overflow_row); + else + executeImplBatch( + method, + state, + aggregates_pool, + row_begin, + row_end, + aggregate_instructions, + all_keys_are_const, + use_compiled_functions, + overflow_row); } else { - executeImplBatch(method, state, aggregates_pool, row_begin, row_end, aggregate_instructions, all_keys_are_const, overflow_row); + executeImplBatch( + method, + state, + aggregates_pool, + row_begin, + row_end, + aggregate_instructions, + all_keys_are_const, + use_compiled_functions, + overflow_row); } } -template +template void NO_INLINE Aggregator::executeImplBatch( Method & method, State & state, @@ -1153,6 +1168,7 @@ void NO_INLINE Aggregator::executeImplBatch( size_t row_end, AggregateFunctionInstruction * aggregate_instructions, bool all_keys_are_const, + bool use_compiled_functions [[maybe_unused]], AggregateDataPtr overflow_row) const { using KeyHolder = decltype(state.getKeyHolder(0, std::declval())); @@ -1284,7 +1300,7 @@ void NO_INLINE Aggregator::executeImplBatch( aggregate_data = aggregates_pool->alignedAlloc(total_size_of_aggregate_states, align_aggregate_states); #if USE_EMBEDDED_COMPILER - if constexpr (use_compiled_functions) + if (use_compiled_functions) { const auto & compiled_aggregate_functions = compiled_aggregate_functions_holder->compiled_aggregate_functions; compiled_aggregate_functions.create_aggregate_states_function(aggregate_data); @@ -1293,20 +1309,6 @@ void NO_INLINE Aggregator::executeImplBatch( static constexpr bool skip_compiled_aggregate_functions = true; createAggregateStates(aggregate_data); } - -#if defined(MEMORY_SANITIZER) - - /// We compile only functions that do not allocate some data in Arena. Only store necessary state in AggregateData place. 
- for (size_t aggregate_function_index = 0; aggregate_function_index < aggregate_functions.size(); ++aggregate_function_index) - { - if (!is_aggregate_function_compiled[aggregate_function_index]) - continue; - - auto aggregate_data_with_offset = aggregate_data + offsets_of_aggregate_states[aggregate_function_index]; - auto data_size = params.aggregates[aggregate_function_index].function->sizeOfData(); - __msan_unpoison(aggregate_data_with_offset, data_size); - } -#endif } else #endif @@ -1339,7 +1341,7 @@ void NO_INLINE Aggregator::executeImplBatch( } #if USE_EMBEDDED_COMPILER - if constexpr (use_compiled_functions) + if (use_compiled_functions) { std::vector columns_data; @@ -1372,9 +1374,8 @@ void NO_INLINE Aggregator::executeImplBatch( for (size_t i = 0; i < aggregate_functions.size(); ++i) { #if USE_EMBEDDED_COMPILER - if constexpr (use_compiled_functions) - if (is_aggregate_function_compiled[i]) - continue; + if (use_compiled_functions && is_aggregate_function_compiled[i]) + continue; #endif AggregateFunctionInstruction * inst = aggregate_instructions + i; @@ -1387,18 +1388,19 @@ void NO_INLINE Aggregator::executeImplBatch( } -template void NO_INLINE Aggregator::executeWithoutKeyImpl( AggregatedDataWithoutKey & res, - size_t row_begin, size_t row_end, + size_t row_begin, + size_t row_end, AggregateFunctionInstruction * aggregate_instructions, - Arena * arena) const + Arena * arena, + bool use_compiled_functions [[maybe_unused]]) const { if (row_begin == row_end) return; #if USE_EMBEDDED_COMPILER - if constexpr (use_compiled_functions) + if (use_compiled_functions) { std::vector columns_data; @@ -1418,20 +1420,6 @@ void NO_INLINE Aggregator::executeWithoutKeyImpl( auto add_into_aggregate_states_function_single_place = compiled_aggregate_functions_holder->compiled_aggregate_functions.add_into_aggregate_states_function_single_place; add_into_aggregate_states_function_single_place(row_begin, row_end, columns_data.data(), res); - -#if defined(MEMORY_SANITIZER) - - /// We compile only functions that do not allocate some data in Arena. Only store necessary state in AggregateData place. 
- for (size_t aggregate_function_index = 0; aggregate_function_index < aggregate_functions.size(); ++aggregate_function_index) - { - if (!is_aggregate_function_compiled[aggregate_function_index]) - continue; - - auto aggregate_data_with_offset = res + offsets_of_aggregate_states[aggregate_function_index]; - auto data_size = params.aggregates[aggregate_function_index].function->sizeOfData(); - __msan_unpoison(aggregate_data_with_offset, data_size); - } -#endif } #endif @@ -1439,13 +1427,10 @@ void NO_INLINE Aggregator::executeWithoutKeyImpl( for (size_t i = 0; i < aggregate_functions.size(); ++i) { AggregateFunctionInstruction * inst = aggregate_instructions + i; - #if USE_EMBEDDED_COMPILER - if constexpr (use_compiled_functions) - if (is_aggregate_function_compiled[i]) - continue; + if (use_compiled_functions && is_aggregate_function_compiled[i]) + continue; #endif - addBatchSinglePlace(row_begin, row_end, inst, res + inst->state_offset, arena); } } @@ -1704,16 +1689,14 @@ bool Aggregator::executeOnBlock(Columns columns, if (result.type == AggregatedDataVariants::Type::without_key) { /// TODO: Enable compilation after investigation -// #if USE_EMBEDDED_COMPILER -// if (compiled_aggregate_functions_holder) -// { -// executeWithoutKeyImpl(result.without_key, row_begin, row_end, aggregate_functions_instructions.data(), result.aggregates_pool); -// } -// else -// #endif - { - executeWithoutKeyImpl(result.without_key, row_begin, row_end, aggregate_functions_instructions.data(), result.aggregates_pool); - } + bool use_compiled_functions = false; + executeWithoutKeyImpl( + result.without_key, + row_begin, + row_end, + aggregate_functions_instructions.data(), + result.aggregates_pool, + use_compiled_functions); } else { @@ -1965,19 +1948,13 @@ Aggregator::convertToBlockImpl(Method & method, Table & data, Arena * arena, Are ConvertToBlockRes res; + bool use_compiled_functions = false; if (final) { #if USE_EMBEDDED_COMPILER - if (compiled_aggregate_functions_holder) - { - static constexpr bool use_compiled_functions = !Method::low_cardinality_optimization; - res = convertToBlockImplFinal(method, data, arena, aggregates_pools, rows); - } - else + use_compiled_functions = compiled_aggregate_functions_holder != nullptr && !Method::low_cardinality_optimization; #endif - { - res = convertToBlockImplFinal(method, data, arena, aggregates_pools, rows); - } + res = convertToBlockImplFinal(method, data, arena, aggregates_pools, use_compiled_functions, rows); } else { @@ -2059,8 +2036,12 @@ inline void Aggregator::insertAggregatesIntoColumns(Mapped & mapped, MutableColu } -template -Block Aggregator::insertResultsIntoColumns(PaddedPODArray & places, OutputBlockColumns && out_cols, Arena * arena, bool has_null_key_data [[maybe_unused]]) const +Block Aggregator::insertResultsIntoColumns( + PaddedPODArray & places, + OutputBlockColumns && out_cols, + Arena * arena, + bool has_null_key_data [[maybe_unused]], + bool use_compiled_functions [[maybe_unused]]) const { std::exception_ptr exception; size_t aggregate_functions_destroy_index = 0; @@ -2068,7 +2049,7 @@ Block Aggregator::insertResultsIntoColumns(PaddedPODArray & pl try { #if USE_EMBEDDED_COMPILER - if constexpr (use_compiled_functions) + if (use_compiled_functions) { /** For JIT compiled functions we need to resize columns before pass them into compiled code. * insert_aggregates_into_columns_function function does not throw exception. 
@@ -2098,14 +2079,13 @@ Block Aggregator::insertResultsIntoColumns(PaddedPODArray & pl for (; aggregate_functions_destroy_index < params.aggregates_size;) { - if constexpr (use_compiled_functions) +#if USE_EMBEDDED_COMPILER + if (use_compiled_functions && is_aggregate_function_compiled[aggregate_functions_destroy_index]) { - if (is_aggregate_function_compiled[aggregate_functions_destroy_index]) - { - ++aggregate_functions_destroy_index; - continue; - } + ++aggregate_functions_destroy_index; + continue; } +#endif auto & final_aggregate_column = out_cols.final_aggregate_columns[aggregate_functions_destroy_index]; size_t offset = offsets_of_aggregate_states[aggregate_functions_destroy_index]; @@ -2127,14 +2107,13 @@ Block Aggregator::insertResultsIntoColumns(PaddedPODArray & pl for (; aggregate_functions_destroy_index < params.aggregates_size; ++aggregate_functions_destroy_index) { - if constexpr (use_compiled_functions) +#if USE_EMBEDDED_COMPILER + if (use_compiled_functions && is_aggregate_function_compiled[aggregate_functions_destroy_index]) { - if (is_aggregate_function_compiled[aggregate_functions_destroy_index]) - { - ++aggregate_functions_destroy_index; - continue; - } + ++aggregate_functions_destroy_index; + continue; } +#endif size_t offset = offsets_of_aggregate_states[aggregate_functions_destroy_index]; aggregate_functions[aggregate_functions_destroy_index]->destroyBatch(0, places.size(), places.data(), offset); @@ -2146,9 +2125,9 @@ Block Aggregator::insertResultsIntoColumns(PaddedPODArray & pl return finalizeBlock(params, getHeader(/* final */ true), std::move(out_cols), /* final */ true, places.size()); } -template -Aggregator::ConvertToBlockRes NO_INLINE -Aggregator::convertToBlockImplFinal(Method & method, Table & data, Arena * arena, Arenas & aggregates_pools, size_t) const +template +Aggregator::ConvertToBlockRes NO_INLINE Aggregator::convertToBlockImplFinal( + Method & method, Table & data, Arena * arena, Arenas & aggregates_pools, bool use_compiled_functions [[maybe_unused]], size_t) const { /// +1 for nullKeyData, if `data` doesn't have it - not a problem, just some memory for one excessive row will be preallocated const size_t max_block_size = (return_single_block ? 
data.size() : std::min(params.max_block_size, data.size())) + 1; @@ -2204,7 +2183,8 @@ Aggregator::convertToBlockImplFinal(Method & method, Table & data, Arena * arena { if (places.size() >= max_block_size) { - res.emplace_back(insertResultsIntoColumns(places, std::move(out_cols.value()), arena, has_null_key_data)); + res.emplace_back( + insertResultsIntoColumns(places, std::move(out_cols.value()), arena, has_null_key_data, use_compiled_functions)); places.clear(); out_cols.reset(); has_null_key_data = false; @@ -2214,12 +2194,13 @@ Aggregator::convertToBlockImplFinal(Method & method, Table & data, Arena * arena if constexpr (return_single_block) { - return insertResultsIntoColumns(places, std::move(out_cols.value()), arena, has_null_key_data); + return insertResultsIntoColumns(places, std::move(out_cols.value()), arena, has_null_key_data, use_compiled_functions); } else { if (out_cols.has_value()) - res.emplace_back(insertResultsIntoColumns(places, std::move(out_cols.value()), arena, has_null_key_data)); + res.emplace_back( + insertResultsIntoColumns(places, std::move(out_cols.value()), arena, has_null_key_data, use_compiled_functions)); return res; } } diff --git a/src/Interpreters/Aggregator.h b/src/Interpreters/Aggregator.h index 67e82cdd784..d7bbe5950a0 100644 --- a/src/Interpreters/Aggregator.h +++ b/src/Interpreters/Aggregator.h @@ -1395,7 +1395,7 @@ private: AggregateDataPtr overflow_row) const; /// Specialization for a particular value no_more_keys. - template + template void executeImplBatch( Method & method, State & state, @@ -1404,16 +1404,17 @@ private: size_t row_end, AggregateFunctionInstruction * aggregate_instructions, bool all_keys_are_const, + bool use_compiled_functions, AggregateDataPtr overflow_row) const; /// For case when there are no keys (all aggregate into one row). 
- template void executeWithoutKeyImpl( AggregatedDataWithoutKey & res, size_t row_begin, size_t row_end, AggregateFunctionInstruction * aggregate_instructions, - Arena * arena) const; + Arena * arena, + bool use_compiled_functions) const; template void writeToTemporaryFileImpl( @@ -1467,12 +1468,16 @@ private: MutableColumns & final_aggregate_columns, Arena * arena) const; - template - Block insertResultsIntoColumns(PaddedPODArray & places, OutputBlockColumns && out_cols, Arena * arena, bool has_null_key_data) const; + Block insertResultsIntoColumns( + PaddedPODArray & places, + OutputBlockColumns && out_cols, + Arena * arena, + bool has_null_key_data, + bool use_compiled_functions) const; - template - ConvertToBlockRes - convertToBlockImplFinal(Method & method, Table & data, Arena * arena, Arenas & aggregates_pools, size_t rows) const; + template + ConvertToBlockRes convertToBlockImplFinal( + Method & method, Table & data, Arena * arena, Arenas & aggregates_pools, bool use_compiled_functions, size_t rows) const; template ConvertToBlockRes From 81b2a1f621d9bd64fde2c4e4f6a83c9b3b0c461a Mon Sep 17 00:00:00 2001 From: Robert Schulze Date: Mon, 11 Mar 2024 15:34:02 +0000 Subject: [PATCH 301/985] Fix build --- programs/obfuscator/Obfuscator.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/programs/obfuscator/Obfuscator.cpp b/programs/obfuscator/Obfuscator.cpp index 317d93aaf0c..b2bf942af4e 100644 --- a/programs/obfuscator/Obfuscator.cpp +++ b/programs/obfuscator/Obfuscator.cpp @@ -1205,7 +1205,7 @@ public: } #pragma clang diagnostic ignored "-Wunused-function" -#clang GCC diagnostic ignored "-Wmissing-declarations" +#pragma clang diagnostic ignored "-Wmissing-declarations" int mainEntryClickHouseObfuscator(int argc, char ** argv) try From 38f41ee311d0a36d194965e5815489a25c60e449 Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 11 Mar 2024 16:55:30 +0100 Subject: [PATCH 302/985] Fix integration test --- tests/integration/test_disk_types/test.py | 10 +++++----- .../test_endpoint_macro_substitution/test.py | 10 +++++----- 2 files changed, 10 insertions(+), 10 deletions(-) diff --git a/tests/integration/test_disk_types/test.py b/tests/integration/test_disk_types/test.py index af482b97be3..86579911b3e 100644 --- a/tests/integration/test_disk_types/test.py +++ b/tests/integration/test_disk_types/test.py @@ -3,10 +3,10 @@ from helpers.cluster import ClickHouseCluster from helpers.test_tools import TSV disk_types = { - "default": "local", - "disk_s3": "s3", - "disk_hdfs": "hdfs", - "disk_encrypted": "s3", + "default": "Local", + "disk_s3": "S3", + "disk_hdfs": "HDFS", + "disk_encrypted": "S3", } @@ -55,7 +55,7 @@ def test_different_types(cluster): def test_select_by_type(cluster): node = cluster.instances["node"] for name, disk_type in list(disk_types.items()): - if disk_type != "s3": + if disk_type != "S3": assert ( node.query( "SELECT name FROM system.disks WHERE type='" + disk_type + "'" diff --git a/tests/integration/test_endpoint_macro_substitution/test.py b/tests/integration/test_endpoint_macro_substitution/test.py index 42a8ddbda84..bec3d9de0e3 100644 --- a/tests/integration/test_endpoint_macro_substitution/test.py +++ b/tests/integration/test_endpoint_macro_substitution/test.py @@ -4,10 +4,10 @@ from helpers.test_tools import TSV from pyhdfs import HdfsClient disk_types = { - "default": "local", - "disk_s3": "s3", - "disk_hdfs": "hdfs", - "disk_encrypted": "s3", + "default": "Local", + "disk_s3": "S3", + "disk_hdfs": "HDFS", + "disk_encrypted": "S3", } @@ -63,7 +63,7 @@ 
def test_select_by_type(cluster): fs = HdfsClient(hosts=cluster.hdfs_ip) for name, disk_type in list(disk_types.items()): - if disk_type != "s3": + if disk_type != "S3": assert ( node.query( "SELECT name FROM system.disks WHERE type='" + disk_type + "'" From 5db08292455fb0c6f47fc0344382ab7cf3508e91 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Ra=C3=BAl=20Mar=C3=ADn?= Date: Mon, 11 Mar 2024 17:20:53 +0100 Subject: [PATCH 303/985] Remove another template --- src/Interpreters/Aggregator.cpp | 55 ++++++++++++++------------------- src/Interpreters/Aggregator.h | 3 +- 2 files changed, 26 insertions(+), 32 deletions(-) diff --git a/src/Interpreters/Aggregator.cpp b/src/Interpreters/Aggregator.cpp index c7ce3e46446..a9578b5540f 100644 --- a/src/Interpreters/Aggregator.cpp +++ b/src/Interpreters/Aggregator.cpp @@ -2906,11 +2906,12 @@ ManyAggregatedDataVariants Aggregator::prepareVariantsToMerge(ManyAggregatedData return non_empty_data; } -template +template void NO_INLINE Aggregator::mergeStreamsImplCase( Arena * aggregates_pool, State & state, Table & data, + bool no_more_keys, AggregateDataPtr overflow_row, size_t row_begin, size_t row_end, @@ -2922,36 +2923,34 @@ void NO_INLINE Aggregator::mergeStreamsImplCase( if (!arena_for_keys) arena_for_keys = aggregates_pool; - for (size_t i = row_begin; i < row_end; ++i) + if (no_more_keys) { - AggregateDataPtr aggregate_data = nullptr; - - if constexpr (!no_more_keys) + for (size_t i = row_begin; i < row_end; i++) { - auto emplace_result = state.emplaceKey(data, i, *arena_for_keys); // NOLINT - if (emplace_result.isInserted()) + auto find_result = state.findKey(data, i, *arena_for_keys); + /// aggregate_date == nullptr means that the new key did not fit in the hash table because of no_more_keys. + AggregateDataPtr value = find_result.isFound() ? find_result.getMapped() : overflow_row; + places[i] = value; + } + } + else + { + for (size_t i = row_begin; i < row_end; i++) + { + auto emplace_result = state.emplaceKey(data, i, *arena_for_keys); + if (!emplace_result.isInserted()) + places[i] = emplace_result.getMapped(); + else { emplace_result.setMapped(nullptr); - aggregate_data = aggregates_pool->alignedAlloc(total_size_of_aggregate_states, align_aggregate_states); + AggregateDataPtr aggregate_data = aggregates_pool->alignedAlloc(total_size_of_aggregate_states, align_aggregate_states); createAggregateStates(aggregate_data); emplace_result.setMapped(aggregate_data); + places[i] = aggregate_data; } - else - aggregate_data = emplace_result.getMapped(); } - else - { - auto find_result = state.findKey(data, i, *arena_for_keys); - if (find_result.isFound()) - aggregate_data = find_result.getMapped(); - } - - /// aggregate_date == nullptr means that the new key did not fit in the hash table because of no_more_keys. - - AggregateDataPtr value = aggregate_data ? 
aggregate_data : overflow_row; - places[i] = value; } for (size_t j = 0; j < params.aggregates_size; ++j) @@ -3005,22 +3004,16 @@ void NO_INLINE Aggregator::mergeStreamsImpl( if (use_cache) { typename Method::State state(key_columns, key_sizes, aggregation_state_cache); - - if (!no_more_keys) - mergeStreamsImplCase(aggregates_pool, state, data, overflow_row, row_begin, row_end, aggregate_columns_data, arena_for_keys); - else - mergeStreamsImplCase(aggregates_pool, state, data, overflow_row, row_begin, row_end, aggregate_columns_data, arena_for_keys); + mergeStreamsImplCase( + aggregates_pool, state, data, no_more_keys, overflow_row, row_begin, row_end, aggregate_columns_data, arena_for_keys); consecutive_keys_cache_stats.update(row_end - row_begin, state.getCacheMissesSinceLastReset()); } else { typename Method::StateNoCache state(key_columns, key_sizes, aggregation_state_cache); - - if (!no_more_keys) - mergeStreamsImplCase(aggregates_pool, state, data, overflow_row, row_begin, row_end, aggregate_columns_data, arena_for_keys); - else - mergeStreamsImplCase(aggregates_pool, state, data, overflow_row, row_begin, row_end, aggregate_columns_data, arena_for_keys); + mergeStreamsImplCase( + aggregates_pool, state, data, no_more_keys, overflow_row, row_begin, row_end, aggregate_columns_data, arena_for_keys); } } diff --git a/src/Interpreters/Aggregator.h b/src/Interpreters/Aggregator.h index d7bbe5950a0..6c357623003 100644 --- a/src/Interpreters/Aggregator.h +++ b/src/Interpreters/Aggregator.h @@ -1513,11 +1513,12 @@ private: bool final, ThreadPool * thread_pool) const; - template + template void mergeStreamsImplCase( Arena * aggregates_pool, State & state, Table & data, + bool no_more_keys, AggregateDataPtr overflow_row, size_t row_begin, size_t row_end, From 74281b0a4e3d9328d01379129ace85e03c145fa4 Mon Sep 17 00:00:00 2001 From: avogar Date: Mon, 11 Mar 2024 16:42:45 +0000 Subject: [PATCH 304/985] Avoid some logical errors in experimantal Object type --- src/Columns/ColumnObject.cpp | 8 ++-- src/Common/ErrorCodes.cpp | 1 + src/DataTypes/ObjectUtils.cpp | 41 ++++++++++++++----- .../Serializations/SerializationObject.cpp | 6 +-- 4 files changed, 38 insertions(+), 18 deletions(-) diff --git a/src/Columns/ColumnObject.cpp b/src/Columns/ColumnObject.cpp index ac2ee309e87..25a62440629 100644 --- a/src/Columns/ColumnObject.cpp +++ b/src/Columns/ColumnObject.cpp @@ -20,12 +20,12 @@ namespace DB namespace ErrorCodes { - extern const int LOGICAL_ERROR; extern const int ILLEGAL_COLUMN; extern const int DUPLICATE_COLUMN; extern const int NUMBER_OF_DIMENSIONS_MISMATCHED; extern const int SIZES_OF_COLUMNS_DOESNT_MATCH; extern const int ARGUMENT_OUT_OF_BOUND; + extern const int EXPERIMENTAL_FEATURE_ERROR; } namespace @@ -247,7 +247,7 @@ void ColumnObject::Subcolumn::checkTypes() const prefix_types.push_back(current_type); auto prefix_common_type = getLeastSupertype(prefix_types); if (!prefix_common_type->equals(*current_type)) - throw Exception(ErrorCodes::LOGICAL_ERROR, + throw Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Data type {} of column at position {} cannot represent all columns from i-th prefix", current_type->getName(), i); } @@ -635,7 +635,7 @@ void ColumnObject::checkConsistency() const { if (num_rows != leaf->data.size()) { - throw Exception(ErrorCodes::LOGICAL_ERROR, "Sizes of subcolumns are inconsistent in ColumnObject." + throw Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Sizes of subcolumns are inconsistent in ColumnObject." 
" Subcolumn '{}' has {} rows, but expected size is {}", leaf->path.getPath(), leaf->data.size(), num_rows); } @@ -919,7 +919,7 @@ void ColumnObject::addSubcolumn(const PathInData & key, size_t new_size) void ColumnObject::addNestedSubcolumn(const PathInData & key, const FieldInfo & field_info, size_t new_size) { if (!key.hasNested()) - throw Exception(ErrorCodes::LOGICAL_ERROR, + throw Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Cannot add Nested subcolumn, because path doesn't contain Nested"); bool inserted = false; diff --git a/src/Common/ErrorCodes.cpp b/src/Common/ErrorCodes.cpp index 44463f7f437..9f2572cbfc6 100644 --- a/src/Common/ErrorCodes.cpp +++ b/src/Common/ErrorCodes.cpp @@ -598,6 +598,7 @@ M(714, UNEXPECTED_CLUSTER) \ M(715, CANNOT_DETECT_FORMAT) \ M(716, CANNOT_FORGET_PARTITION) \ + M(717, EXPERIMENTAL_FEATURE_ERROR) \ \ M(999, KEEPER_EXCEPTION) \ M(1000, POCO_EXCEPTION) \ diff --git a/src/DataTypes/ObjectUtils.cpp b/src/DataTypes/ObjectUtils.cpp index 23d29136c85..48392a614a5 100644 --- a/src/DataTypes/ObjectUtils.cpp +++ b/src/DataTypes/ObjectUtils.cpp @@ -28,9 +28,9 @@ namespace DB namespace ErrorCodes { extern const int TYPE_MISMATCH; - extern const int LOGICAL_ERROR; extern const int INCOMPATIBLE_COLUMNS; extern const int NOT_IMPLEMENTED; + extern const int EXPERIMENTAL_FEATURE_ERROR; } size_t getNumberOfDimensions(const IDataType & type) @@ -92,7 +92,7 @@ ColumnPtr createArrayOfColumn(ColumnPtr column, size_t num_dimensions) Array createEmptyArrayField(size_t num_dimensions) { if (num_dimensions == 0) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Cannot create array field with 0 dimensions"); + throw Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Cannot create array field with 0 dimensions"); Array array; Array * current_array = &array; @@ -231,7 +231,7 @@ static std::pair recursivlyConvertDynamicColumnToTuple( }; } - throw Exception(ErrorCodes::LOGICAL_ERROR, "Type {} unexpectedly has dynamic columns", type->getName()); + throw Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Type {} unexpectedly has dynamic columns", type->getName()); } void convertDynamicColumnsToTuples(Block & block, const StorageSnapshotPtr & storage_snapshot) @@ -247,7 +247,7 @@ void convertDynamicColumnsToTuples(Block & block, const StorageSnapshotPtr & sto GetColumnsOptions options(GetColumnsOptions::AllPhysical); auto storage_column = storage_snapshot->tryGetColumn(options, column.name); if (!storage_column) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Column '{}' not found in storage", column.name); + throw Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Column '{}' not found in storage", column.name); auto storage_column_concrete = storage_snapshot->getColumn(options.withExtendedObjects(), column.name); @@ -315,7 +315,7 @@ static DataTypePtr getLeastCommonTypeForObject(const DataTypes & types, bool che { const auto * type_tuple = typeid_cast(type.get()); if (!type_tuple) - throw Exception(ErrorCodes::LOGICAL_ERROR, + throw Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Least common type for object can be deduced only from tuples, but {} given", type->getName()); auto [tuple_paths, tuple_types] = flattenTuple(type); @@ -427,7 +427,7 @@ static DataTypePtr getLeastCommonTypeForDynamicColumnsImpl( if (const auto * type_tuple = typeid_cast(type_in_storage.get())) return getLeastCommonTypeForTuple(*type_tuple, concrete_types, check_ambiguos_paths); - throw Exception(ErrorCodes::LOGICAL_ERROR, "Type {} unexpectedly has dynamic columns", type_in_storage->getName()); + throw 
Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Type {} unexpectedly has dynamic columns", type_in_storage->getName()); } DataTypePtr getLeastCommonTypeForDynamicColumns( @@ -481,7 +481,7 @@ DataTypePtr createConcreteEmptyDynamicColumn(const DataTypePtr & type_in_storage return recreateTupleWithElements(*type_tuple, new_elements); } - throw Exception(ErrorCodes::LOGICAL_ERROR, "Type {} unexpectedly has dynamic columns", type_in_storage->getName()); + throw Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Type {} unexpectedly has dynamic columns", type_in_storage->getName()); } bool hasDynamicSubcolumns(const ColumnsDescription & columns) @@ -613,7 +613,7 @@ DataTypePtr reduceNumberOfDimensions(DataTypePtr type, size_t dimensions_to_redu { const auto * type_array = typeid_cast(type.get()); if (!type_array) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Not enough dimensions to reduce"); + throw Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Not enough dimensions to reduce"); type = type_array->getNestedType(); } @@ -627,7 +627,7 @@ ColumnPtr reduceNumberOfDimensions(ColumnPtr column, size_t dimensions_to_reduce { const auto * column_array = typeid_cast(column.get()); if (!column_array) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Not enough dimensions to reduce"); + throw Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Not enough dimensions to reduce"); column = column_array->getDataPtr(); } @@ -705,6 +705,7 @@ ColumnWithTypeAndDimensions createTypeFromNode(const Node & node) size_t num_elements = tuple_columns.size(); Columns tuple_elements_columns(num_elements); DataTypes tuple_elements_types(num_elements); + size_t last_offset = assert_cast(*offsets_columns.back()).getData().back(); /// Reduce extra array dimensions to get columns and types of Nested elements. for (size_t i = 0; i < num_elements; ++i) @@ -712,6 +713,14 @@ ColumnWithTypeAndDimensions createTypeFromNode(const Node & node) assert(tuple_columns[i].array_dimensions == tuple_columns[0].array_dimensions); tuple_elements_columns[i] = reduceNumberOfDimensions(tuple_columns[i].column, tuple_columns[i].array_dimensions); tuple_elements_types[i] = reduceNumberOfDimensions(tuple_columns[i].type, tuple_columns[i].array_dimensions); + if (tuple_elements_columns[i]->size() != last_offset) + throw Exception( + ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, + "Cannot create a type for subcolumn {} in Object data type: offsets_column has data inconsistent with nested_column. " + "Data size: {}, last offset: {}", + node.path.getPath(), + tuple_elements_columns[i]->size(), + last_offset); } auto result_column = ColumnArray::create(ColumnTuple::create(tuple_elements_columns), offsets_columns.back()); @@ -720,6 +729,16 @@ ColumnWithTypeAndDimensions createTypeFromNode(const Node & node) /// Recreate result Array type and Array column. for (auto it = offsets_columns.rbegin() + 1; it != offsets_columns.rend(); ++it) { + last_offset = assert_cast((**it)).getData().back(); + if (result_column->size() != last_offset) + throw Exception( + ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, + "Cannot create a type for subcolumn {} in Object data type: offsets_column has data inconsistent with nested_column. 
" + "Data size: {}, last offset: {}", + node.path.getPath(), + result_column->size(), + last_offset); + result_column = ColumnArray::create(result_column, *it); result_type = std::make_shared(result_type); } @@ -822,7 +841,7 @@ std::pair unflattenTuple( assert(paths.size() == tuple_columns.size()); if (paths.empty()) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Cannot unflatten empty Tuple"); + throw Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Cannot unflatten empty Tuple"); /// We add all paths to the subcolumn tree and then create a type from it. /// The tree stores column, type and number of array dimensions @@ -841,7 +860,7 @@ std::pair unflattenTuple( tree.add(paths[i], [&](Node::Kind kind, bool exists) -> std::shared_ptr { if (pos >= num_parts) - throw Exception(ErrorCodes::LOGICAL_ERROR, + throw Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Not enough name parts for path {}. Expected at least {}, got {}", paths[i].getPath(), pos + 1, num_parts); diff --git a/src/DataTypes/Serializations/SerializationObject.cpp b/src/DataTypes/Serializations/SerializationObject.cpp index e6dc16ef5a0..1bdc29daebd 100644 --- a/src/DataTypes/Serializations/SerializationObject.cpp +++ b/src/DataTypes/Serializations/SerializationObject.cpp @@ -29,7 +29,7 @@ namespace ErrorCodes extern const int INCORRECT_DATA; extern const int CANNOT_READ_ALL_DATA; extern const int ARGUMENT_OUT_OF_BOUND; - extern const int LOGICAL_ERROR; + extern const int EXPERIMENTAL_FEATURE_ERROR; } template @@ -177,7 +177,7 @@ void SerializationObject::serializeBinaryBulkStatePrefix( auto * stream = settings.getter(settings.path); if (!stream) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Missing stream for kind of binary serialization"); + throw Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Missing stream for kind of binary serialization"); auto [tuple_column, tuple_type] = unflattenObjectToTuple(column_object); @@ -288,7 +288,7 @@ void SerializationObject::serializeBinaryBulkWithMultipleStreams( if (!state_object->nested_type->equals(*tuple_type)) { - throw Exception(ErrorCodes::LOGICAL_ERROR, + throw Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Types of internal column of Object mismatched. 
Expected: {}, Got: {}", state_object->nested_type->getName(), tuple_type->getName()); } From 260c6387555b3823e56db135f80adaa5e0c300ab Mon Sep 17 00:00:00 2001 From: avogar Date: Mon, 11 Mar 2024 16:59:01 +0000 Subject: [PATCH 305/985] Replace forgotten logical error --- src/DataTypes/ObjectUtils.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/DataTypes/ObjectUtils.cpp b/src/DataTypes/ObjectUtils.cpp index 48392a614a5..c565930f49a 100644 --- a/src/DataTypes/ObjectUtils.cpp +++ b/src/DataTypes/ObjectUtils.cpp @@ -653,7 +653,7 @@ ColumnWithTypeAndDimensions createTypeFromNode(const Node & node) auto collect_tuple_elemets = [](const auto & children) { if (children.empty()) - throw Exception(ErrorCodes::LOGICAL_ERROR, "Cannot create type from empty Tuple or Nested node"); + throw Exception(ErrorCodes::EXPERIMENTAL_FEATURE_ERROR, "Cannot create type from empty Tuple or Nested node"); std::vector> tuple_elements; tuple_elements.reserve(children.size()); From 16e01eb93ad449c61417dcaccd570439364b0714 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Mon, 11 Mar 2024 18:05:51 +0100 Subject: [PATCH 306/985] Fix style --- src/Core/Settings.cpp | 1 + 1 file changed, 1 insertion(+) diff --git a/src/Core/Settings.cpp b/src/Core/Settings.cpp index fb456b46d89..8257b94cd9f 100644 --- a/src/Core/Settings.cpp +++ b/src/Core/Settings.cpp @@ -15,6 +15,7 @@ namespace ErrorCodes extern const int THERE_IS_NO_PROFILE; extern const int NO_ELEMENTS_IN_CONFIG; extern const int UNKNOWN_ELEMENT_IN_CONFIG; + extern const int BAD_ARGUMENTS; } IMPLEMENT_SETTINGS_TRAITS(SettingsTraits, LIST_OF_SETTINGS) From f656a015385898602cb651b419b46927f99ab602 Mon Sep 17 00:00:00 2001 From: Max Kainov Date: Mon, 11 Mar 2024 16:39:13 +0000 Subject: [PATCH 307/985] CI: fix sync build issue with reuse #do_not_test --- tests/ci/ci.py | 21 +++++++++++++++------ 1 file changed, 15 insertions(+), 6 deletions(-) diff --git a/tests/ci/ci.py b/tests/ci/ci.py index 9d57f161be3..cc4d0b11eef 100644 --- a/tests/ci/ci.py +++ b/tests/ci/ci.py @@ -140,7 +140,7 @@ class CiCache: self.s3 = s3 self.job_digests = job_digests self.cache_s3_paths = { - job_type: f"{self._S3_CACHE_PREFIX}/{job_type.value}-{self.job_digests[self._get_reference_job_name(job_type)]}/" + job_type: f"{self._S3_CACHE_PREFIX}/{job_type.value}-{self._get_digest_for_job_type(self.job_digests, job_type)}/" for job_type in self.JobType } self.s3_record_prefixes = { @@ -155,14 +155,23 @@ class CiCache: if not self._LOCAL_CACHE_PATH.exists(): self._LOCAL_CACHE_PATH.mkdir(parents=True, exist_ok=True) - def _get_reference_job_name(self, job_type: JobType) -> str: - res = Build.PACKAGE_RELEASE + def _get_digest_for_job_type( + self, job_digests: Dict[str, str], job_type: JobType + ) -> str: if job_type == self.JobType.DOCS: - res = JobNames.DOCS_CHECK + res = job_digests[JobNames.DOCS_CHECK] elif job_type == self.JobType.SRCS: - res = Build.PACKAGE_RELEASE + # any build type job has the same digest - pick up Build.PACKAGE_RELEASE or Build.PACKAGE_ASAN as a failover + # Build.PACKAGE_RELEASE may not exist in the list if we have reduced CI pipeline + if Build.PACKAGE_RELEASE in job_digests: + res = job_digests[Build.PACKAGE_RELEASE] + elif Build.PACKAGE_ASAN in job_digests: + # failover, if failover does not work - fix it! + res = job_digests[Build.PACKAGE_ASAN] + else: + assert False, "BUG, no build job in digest' list" else: - assert False + assert False, "BUG, New JobType? 
- please update func" return res def _get_record_file_name( From f973e405eeb4f28a6a937c26d19cad54acd00eb4 Mon Sep 17 00:00:00 2001 From: Max Kainov Date: Wed, 7 Feb 2024 19:36:28 +0000 Subject: [PATCH 308/985] CI: fixing ARM integration tests #do_not_test --- tests/ci/ci.py | 41 ++++++++++++++++++++++++++++++++++++----- 1 file changed, 36 insertions(+), 5 deletions(-) diff --git a/tests/ci/ci.py b/tests/ci/ci.py index 9d57f161be3..898d23be843 100644 --- a/tests/ci/ci.py +++ b/tests/ci/ci.py @@ -1183,13 +1183,13 @@ def _configure_jobs( if batches_to_do: jobs_to_do.append(job) + jobs_params[job] = { + "batches": batches_to_do, + "num_batches": num_batches, + } elif add_to_skip: # treat job as being skipped only if it's controlled by digest jobs_to_skip.append(job) - jobs_params[job] = { - "batches": batches_to_do, - "num_batches": num_batches, - } if not pr_info.is_release_branch(): # randomization bucket filtering (pick one random job from each bucket, for jobs with configured random_bucket property) @@ -1268,6 +1268,33 @@ def _configure_jobs( jobs_to_do = list( set(job for job in jobs_to_do_requested if job not in jobs_to_skip) ) + # if requested job does not have params in jobs_params (it happens for "run_by_label" job) + # we need to add params - otherwise it won't run as "batches" list will be empty + for job in jobs_to_do: + if job not in jobs_params: + num_batches = CI_CONFIG.get_job_config(job).num_batches + jobs_params[job] = { + "batches": list(range(num_batches)), + "num_batches": num_batches, + } + + requested_batches = set() + for token in commit_tokens: + if token.startswith("batch_"): + try: + batches = [ + int(batch) for batch in token.removeprefix("batch_").split("_") + ] + except Exception: + print(f"ERROR: failed to parse commit tag [{token}]") + requested_batches.update(batches) + if requested_batches: + print( + f"NOTE: Only specific job batches were requested [{list(requested_batches)}]" + ) + for job, params in jobs_params.items(): + if params["num_batches"] > 1: + params["batches"] = list(requested_batches) return { "digests": digests, @@ -1372,7 +1399,11 @@ def _update_gh_statuses_action(indata: Dict, s3: S3Helper) -> None: def _fetch_commit_tokens(message: str) -> List[str]: pattern = r"#[\w-]+" matches = [match[1:] for match in re.findall(pattern, message)] - res = [match for match in matches if match in Labels or match.startswith("job_")] + res = [ + match + for match in matches + if match in Labels or match.startswith("job_") or match.startswith("batch_") + ] return res From 4b94bcd54ebd8713db8aefc453edaf15a1aa55ab Mon Sep 17 00:00:00 2001 From: Kseniia Sumarokova <54203879+kssenii@users.noreply.github.com> Date: Mon, 11 Mar 2024 18:41:17 +0100 Subject: [PATCH 309/985] Update ReadSettings.h --- src/IO/ReadSettings.h | 1 - 1 file changed, 1 deletion(-) diff --git a/src/IO/ReadSettings.h b/src/IO/ReadSettings.h index fb8cbaf4a98..c0a63bf51b1 100644 --- a/src/IO/ReadSettings.h +++ b/src/IO/ReadSettings.h @@ -99,7 +99,6 @@ struct ReadSettings bool enable_filesystem_cache = true; bool read_from_filesystem_cache_if_exists_otherwise_bypass_cache = false; bool enable_filesystem_cache_log = false; - bool force_read_through_cache_merges = false; size_t filesystem_cache_segments_batch_size = 20; bool use_page_cache_for_disks_without_file_cache = false; From fd68fed0470214d5c8734b0c89fbb779cf9b821f Mon Sep 17 00:00:00 2001 From: Han Fei Date: Mon, 11 Mar 2024 19:21:35 +0100 Subject: [PATCH 310/985] fix flaky 02949_ttl_group_by_bug --- 
tests/queries/0_stateless/02949_ttl_group_by_bug.sql | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02949_ttl_group_by_bug.sql b/tests/queries/0_stateless/02949_ttl_group_by_bug.sql index 2888f6e7d66..a3d0794c897 100644 --- a/tests/queries/0_stateless/02949_ttl_group_by_bug.sql +++ b/tests/queries/0_stateless/02949_ttl_group_by_bug.sql @@ -2,7 +2,7 @@ DROP TABLE IF EXISTS ttl_group_by_bug; CREATE TABLE ttl_group_by_bug (key UInt32, ts DateTime, value UInt32, min_value UInt32 default value, max_value UInt32 default value) -ENGINE = MergeTree() PARTITION BY toYYYYMM(ts) +ENGINE = MergeTree() ORDER BY (key, toStartOfInterval(ts, toIntervalMinute(3)), ts) TTL ts + INTERVAL 5 MINUTE GROUP BY key, toStartOfInterval(ts, toIntervalMinute(3)) SET value = sum(value), min_value = min(min_value), max_value = max(max_value), ts=min(toStartOfInterval(ts, toIntervalMinute(3))); From a1e5161cee50650a5c4e87ca60e7ed9eb61451b4 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Ra=C3=BAl=20Mar=C3=ADn?= Date: Mon, 11 Mar 2024 19:25:34 +0100 Subject: [PATCH 311/985] Disable sanitizers with 02784_parallel_replicas_automatic_decision_join --- .../02784_parallel_replicas_automatic_decision_join.sh | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/02784_parallel_replicas_automatic_decision_join.sh b/tests/queries/0_stateless/02784_parallel_replicas_automatic_decision_join.sh index ef3e6000903..801cd22b79f 100755 --- a/tests/queries/0_stateless/02784_parallel_replicas_automatic_decision_join.sh +++ b/tests/queries/0_stateless/02784_parallel_replicas_automatic_decision_join.sh @@ -1,5 +1,6 @@ #!/usr/bin/env bash -## Note: The analyzer doesn't support JOIN with parallel replicas yet +# Tags: no-tsan, no-asan, no-msan +# It's not clear why distributed aggregation is much slower with sanitizers (https://github.com/ClickHouse/ClickHouse/issues/60625) CUR_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd) # shellcheck source=../shell_config.sh From 55a82047613c607dedb592fed019d04455e8c8e8 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Mon, 11 Mar 2024 19:43:30 +0100 Subject: [PATCH 312/985] Fix test --- .../0_stateless/03003_compatibility_setting_bad_value.sql | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/queries/0_stateless/03003_compatibility_setting_bad_value.sql b/tests/queries/0_stateless/03003_compatibility_setting_bad_value.sql index 9a6f4e7944a..48e98798c51 100644 --- a/tests/queries/0_stateless/03003_compatibility_setting_bad_value.sql +++ b/tests/queries/0_stateless/03003_compatibility_setting_bad_value.sql @@ -1,2 +1,2 @@ -select 42 settings compatibility=NULL; -- {clientError BAD_GET} +select 42 settings compatibility=NULL; -- {clientError BAD_ARGUMENTS} From 5a71636411cb358c94e58b7caac18c22104b0e1c Mon Sep 17 00:00:00 2001 From: kssenii Date: Mon, 11 Mar 2024 19:44:52 +0100 Subject: [PATCH 313/985] Fxi --- tests/integration/test_disk_types/test.py | 30 +++++++++++++++++++ .../test_endpoint_macro_substitution/test.py | 9 +++++- 2 files changed, 38 insertions(+), 1 deletion(-) diff --git a/tests/integration/test_disk_types/test.py b/tests/integration/test_disk_types/test.py index 86579911b3e..5047cdc605e 100644 --- a/tests/integration/test_disk_types/test.py +++ b/tests/integration/test_disk_types/test.py @@ -50,6 +50,36 @@ def test_different_types(cluster): assert ( fields[encrypted_col_ix] == "0" ), f"{fields[name_col_ix]} expected to be non-encrypted!" 
+def test_different_types(cluster): + node = cluster.instances["node"] + response = TSV.toMat(node.query("SELECT * FROM system.disks FORMAT TSVWithNames")) + + assert len(response) > len(disk_types) # at least one extra line for header + + name_col_ix = response[0].index("name") + type_col_ix = response[0].index("type") + encrypted_col_ix = response[0].index("is_encrypted") + + for fields in response[1:]: # skip header + assert len(fields) >= 7 + expected_disk_type = disk_types.get(fields[name_col_ix], "UNKNOWN") + + if expected_disk_type != "Local": + disk_type = fields[response[0].index("object_storage_type")] + else: + disk_type = fields[type_col_ix] + + assert ( + expected_disk_type == disk_type + ), f"Wrong type ({fields[type_col_ix]}) for disk {fields[name_col_ix]}!" + if "encrypted" in fields[name_col_ix]: + assert ( + fields[encrypted_col_ix] == "1" + ), f"{fields[name_col_ix]} expected to be encrypted!" + else: + assert ( + fields[encrypted_col_ix] == "0" + ), f"{fields[name_col_ix]} expected to be non-encrypted!" def test_select_by_type(cluster): diff --git a/tests/integration/test_endpoint_macro_substitution/test.py b/tests/integration/test_endpoint_macro_substitution/test.py index bec3d9de0e3..e161d8e82ff 100644 --- a/tests/integration/test_endpoint_macro_substitution/test.py +++ b/tests/integration/test_endpoint_macro_substitution/test.py @@ -45,8 +45,15 @@ def test_different_types(cluster): for fields in response[1:]: # skip header assert len(fields) >= 7 + expected_disk_type = disk_types.get(fields[name_col_ix], "UNKNOWN") + + if expected_disk_type != "Local": + disk_type = fields[response[0].index("object_storage_type")] + else: + disk_type = fields[type_col_ix] + assert ( - disk_types.get(fields[name_col_ix], "UNKNOWN") == fields[type_col_ix] + expected_disk_type == disk_type ), f"Wrong type ({fields[type_col_ix]}) for disk {fields[name_col_ix]}!" if "encrypted" in fields[name_col_ix]: assert ( From b7b83085d1722b192d802ffc3677ea6d0f03c85a Mon Sep 17 00:00:00 2001 From: Max Kainov Date: Mon, 11 Mar 2024 18:49:45 +0000 Subject: [PATCH 314/985] CI: ci.py hot style fix #do_not_test --- tests/ci/ci.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/tests/ci/ci.py b/tests/ci/ci.py index a699642691b..29906e6571f 100644 --- a/tests/ci/ci.py +++ b/tests/ci/ci.py @@ -55,6 +55,8 @@ from report import ERROR, SUCCESS, BuildResult, JobReport from s3_helper import S3Helper from version_helper import get_version_from_repo +# pylint: disable=too-many-lines + @dataclass class PendingState: From 5a400c181b818cf3bbf371eb388a937ee816a66c Mon Sep 17 00:00:00 2001 From: Azat Khuzhin Date: Mon, 11 Mar 2024 09:49:25 +0100 Subject: [PATCH 315/985] Fix llvm symbolizer on CI In #61011 the whole toolchain installation had been removed from the base image to reduce image sizes, and this is a good thing indeed. 
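As background (an illustrative sketch, not something this patch changes): the
ASan/TSan/MSan runtimes symbolize stack traces by invoking an external
llvm-symbolizer binary, which they locate either on PATH or via the
external_symbolizer_path sanitizer option, roughly like this:

    # illustrative only: point the sanitizer runtimes at the symbolizer binary
    export ASAN_SYMBOLIZER_PATH=/usr/bin/llvm-symbolizer
    export TSAN_OPTIONS="external_symbolizer_path=/usr/bin/llvm-symbolizer"
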
However it also breaks the symbolizer for sanitizers, which makes stacktraces unreadable, so let's fix this by getting back llvm package, this should be OK, since it's size is not gigabytes, but only 48MiB (at least for llvm-14): # dpkg -L llvm-14| xargs file | grep -v directory | cut -d: -f1 | xargs du -sch | grep total 48M total Signed-off-by: Azat Khuzhin --- docker/test/base/Dockerfile | 3 +++ docker/test/fasttest/Dockerfile | 3 --- docker/test/util/Dockerfile | 2 ++ 3 files changed, 5 insertions(+), 3 deletions(-) diff --git a/docker/test/base/Dockerfile b/docker/test/base/Dockerfile index 55229e893de..2317f84e0cb 100644 --- a/docker/test/base/Dockerfile +++ b/docker/test/base/Dockerfile @@ -33,6 +33,9 @@ ENV TSAN_OPTIONS='halt_on_error=1 abort_on_error=1 history_size=7 memory_limit_m ENV UBSAN_OPTIONS='print_stacktrace=1' ENV MSAN_OPTIONS='abort_on_error=1 poison_in_dtor=1' +# for external_symbolizer_path +RUN ln -s /usr/bin/llvm-symbolizer-${LLVM_VERSION} /usr/bin/llvm-symbolizer + RUN echo "en_US.UTF-8 UTF-8" > /etc/locale.gen && locale-gen en_US.UTF-8 ENV LC_ALL en_US.UTF-8 diff --git a/docker/test/fasttest/Dockerfile b/docker/test/fasttest/Dockerfile index 62cdcc3f830..912ff191e57 100644 --- a/docker/test/fasttest/Dockerfile +++ b/docker/test/fasttest/Dockerfile @@ -14,7 +14,6 @@ RUN apt-get update \ libclang-${LLVM_VERSION}-dev \ libclang-rt-${LLVM_VERSION}-dev \ lld-${LLVM_VERSION} \ - llvm-${LLVM_VERSION} \ llvm-${LLVM_VERSION}-dev \ lsof \ ninja-build \ @@ -37,8 +36,6 @@ RUN pip3 install numpy==1.26.3 scipy==1.12.0 pandas==1.5.3 Jinja2==3.1.3 # This symlink is required by gcc to find the lld linker RUN ln -s /usr/bin/lld-${LLVM_VERSION} /usr/bin/ld.lld -# for external_symbolizer_path -RUN ln -s /usr/bin/llvm-symbolizer-${LLVM_VERSION} /usr/bin/llvm-symbolizer # FIXME: workaround for "The imported target "merge-fdata" references the file" error # https://salsa.debian.org/pkg-llvm-team/llvm-toolchain/-/commit/992e52c0b156a5ba9c6a8a54f8c4857ddd3d371d RUN sed -i '/_IMPORT_CHECK_FILES_FOR_\(mlir-\|llvm-bolt\|merge-fdata\|MLIR\)/ {s|^|#|}' /usr/lib/llvm-${LLVM_VERSION}/lib/cmake/llvm/LLVMExports-*.cmake diff --git a/docker/test/util/Dockerfile b/docker/test/util/Dockerfile index 4f2dc9df849..5446adf3793 100644 --- a/docker/test/util/Dockerfile +++ b/docker/test/util/Dockerfile @@ -26,6 +26,8 @@ RUN apt-get update \ && export CODENAME="$(lsb_release --codename --short | tr 'A-Z' 'a-z')" \ && echo "deb https://apt.llvm.org/${CODENAME}/ llvm-toolchain-${CODENAME}-${LLVM_VERSION} main" >> \ /etc/apt/sources.list \ + && apt-get update \ + && apt-get install --yes --no-install-recommends --verbose-versions llvm-${LLVM_VERSION} \ && apt-get clean \ && rm -rf /var/lib/apt/lists/* /var/cache/debconf /tmp/* From 9b055c3a43039387b42e755efddd83b9a8934ca6 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Mon, 11 Mar 2024 20:38:30 +0100 Subject: [PATCH 316/985] Use assert_cast to prevent nullptr dereference on bad column types in FunctionsConversion --- src/Functions/FunctionsConversion.h | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/Functions/FunctionsConversion.h b/src/Functions/FunctionsConversion.h index 1522e76893e..f338af28240 100644 --- a/src/Functions/FunctionsConversion.h +++ b/src/Functions/FunctionsConversion.h @@ -4561,7 +4561,7 @@ arguments, result_type, input_rows_count); \ if (from_low_cardinality) { - const auto * col_low_cardinality = typeid_cast(arguments[0].column.get()); + const auto * col_low_cardinality 
= assert_cast(arguments[0].column.get()); if (skip_not_null_check && col_low_cardinality->containsNull()) throw Exception(ErrorCodes::CANNOT_INSERT_NULL_IN_ORDINARY_COLUMN, "Cannot convert NULL value to non-Nullable type"); @@ -4586,7 +4586,7 @@ arguments, result_type, input_rows_count); \ if (to_low_cardinality) { auto res_column = to_low_cardinality->createColumn(); - auto * col_low_cardinality = typeid_cast(res_column.get()); + auto * col_low_cardinality = assert_cast(res_column.get()); if (from_low_cardinality && !src_converted_to_full_column) { From 3a26b9c89ee3083884fde341c2af418bcde2f4cf Mon Sep 17 00:00:00 2001 From: Nikita Taranov Date: Mon, 11 Mar 2024 19:42:25 +0000 Subject: [PATCH 317/985] impl --- .../0_stateless/02887_mutations_subcolumns.reference | 6 +++--- tests/queries/0_stateless/02887_mutations_subcolumns.sql | 4 ++-- 2 files changed, 5 insertions(+), 5 deletions(-) diff --git a/tests/queries/0_stateless/02887_mutations_subcolumns.reference b/tests/queries/0_stateless/02887_mutations_subcolumns.reference index c2d6cbbd225..1ccc83b48a3 100644 --- a/tests/queries/0_stateless/02887_mutations_subcolumns.reference +++ b/tests/queries/0_stateless/02887_mutations_subcolumns.reference @@ -5,6 +5,6 @@ 4 ttt 5 ttt 6 ttt -{"a":"1","obj":{"k1":1,"k2":null,"k3":null}} -{"a":"3","obj":{"k1":null,"k2":null,"k3":1}} -{"a":"1","obj":{"k1":1,"k2":null,"k3":null}} +1 [('k1',1)] +3 [('k3',1)] +1 [('k1',1)] diff --git a/tests/queries/0_stateless/02887_mutations_subcolumns.sql b/tests/queries/0_stateless/02887_mutations_subcolumns.sql index a01158e1b06..87b3009e929 100644 --- a/tests/queries/0_stateless/02887_mutations_subcolumns.sql +++ b/tests/queries/0_stateless/02887_mutations_subcolumns.sql @@ -40,9 +40,9 @@ INSERT INTO t_mutations_subcolumns VALUES (2, '{"k2": 1}'); INSERT INTO t_mutations_subcolumns VALUES (3, '{"k3": 1}'); ALTER TABLE t_mutations_subcolumns DELETE WHERE obj.k2 = 1; -SELECT * FROM t_mutations_subcolumns ORDER BY a FORMAT JSONEachRow; +SELECT a, arrayFilter(x -> not isNull(x.2), tupleToNameValuePairs(obj)) FROM t_mutations_subcolumns ORDER BY a; ALTER TABLE t_mutations_subcolumns DELETE WHERE isNull(obj.k1); -SELECT * FROM t_mutations_subcolumns ORDER BY a FORMAT JSONEachRow; +SELECT a, arrayFilter(x -> not isNull(x.2), tupleToNameValuePairs(obj)) FROM t_mutations_subcolumns ORDER BY a; DROP TABLE t_mutations_subcolumns; From 2e74685ba6ea8a3cc32ff0e21d0ee657517ef5a4 Mon Sep 17 00:00:00 2001 From: avogar Date: Mon, 11 Mar 2024 19:58:43 +0000 Subject: [PATCH 318/985] Make variant tests a bit faster --- .../02941_variant_type_2.reference | 80 +++++++++---------- .../0_stateless/02941_variant_type_2.sh | 12 +-- ...different_local_and_global_order.reference | 30 +++---- ...e_with_different_local_and_global_order.sh | 8 +- 4 files changed, 65 insertions(+), 65 deletions(-) diff --git a/tests/queries/0_stateless/02941_variant_type_2.reference b/tests/queries/0_stateless/02941_variant_type_2.reference index 4b6d53c52ac..20a5176cb5e 100644 --- a/tests/queries/0_stateless/02941_variant_type_2.reference +++ b/tests/queries/0_stateless/02941_variant_type_2.reference @@ -1,51 +1,51 @@ Memory test4 insert test4 select -1000000 -200000 -200000 -200000 -200000 -200000 -200000 -200000 +500000 +100000 +100000 +100000 +100000 +100000 +100000 +100000 MergeTree compact test4 insert test4 select -1000000 -200000 -200000 -200000 -200000 -200000 -200000 -200000 +500000 +100000 +100000 +100000 +100000 +100000 +100000 +100000 test4 select -1000000 -200000 -200000 -200000 -200000 -200000 -200000 
-200000 +500000 +100000 +100000 +100000 +100000 +100000 +100000 +100000 MergeTree wide test4 insert test4 select -1000000 -200000 -200000 -200000 -200000 -200000 -200000 -200000 +500000 +100000 +100000 +100000 +100000 +100000 +100000 +100000 test4 select -1000000 -200000 -200000 -200000 -200000 -200000 -200000 -200000 +500000 +100000 +100000 +100000 +100000 +100000 +100000 +100000 diff --git a/tests/queries/0_stateless/02941_variant_type_2.sh b/tests/queries/0_stateless/02941_variant_type_2.sh index 509c537e7fc..d1fa0a777c9 100755 --- a/tests/queries/0_stateless/02941_variant_type_2.sh +++ b/tests/queries/0_stateless/02941_variant_type_2.sh @@ -12,12 +12,12 @@ CH_CLIENT="$CLICKHOUSE_CLIENT --allow_experimental_variant_type=1 --allow_suspic function test4_insert() { echo "test4 insert" - $CH_CLIENT -nmq "insert into test select number, NULL from numbers(200000); -insert into test select number + 200000, number from numbers(200000); -insert into test select number + 400000, 'str_' || toString(number) from numbers(200000); -insert into test select number + 600000, ('lc_str_' || toString(number))::LowCardinality(String) from numbers(200000); -insert into test select number + 800000, tuple(number, number + 1)::Tuple(a UInt32, b UInt32) from numbers(200000); -insert into test select number + 1000000, range(number % 20 + 1)::Array(UInt64) from numbers(200000);" + $CH_CLIENT -nmq "insert into test select number, NULL from numbers(100000); +insert into test select number + 100000, number from numbers(100000); +insert into test select number + 200000, 'str_' || toString(number) from numbers(100000); +insert into test select number + 300000, ('lc_str_' || toString(number))::LowCardinality(String) from numbers(100000); +insert into test select number + 400000, tuple(number, number + 1)::Tuple(a UInt32, b UInt32) from numbers(100000); +insert into test select number + 500000, range(number % 20 + 1)::Array(UInt64) from numbers(100000);" } function test4_select diff --git a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference index 1736a307c42..4109a88997c 100644 --- a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference +++ b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.reference @@ -44,9 +44,9 @@ str_38 str_38 \N ----------------------------------------------------------------------------------------------------------- test2 insert test2 select -2500000 -750000 -1750000 +500000 +100000 +400000 ----------------------------------------------------------------------------------------------------------- MergeTree compact test1 insert @@ -136,14 +136,14 @@ str_38 str_38 \N ----------------------------------------------------------------------------------------------------------- test2 insert test2 select -2500000 -750000 -1750000 +500000 +100000 +400000 ----------------------------------------------------------------------------------------------------------- test2 select -2500000 -750000 -1750000 +500000 +100000 +400000 ----------------------------------------------------------------------------------------------------------- MergeTree wide test1 insert @@ -233,12 +233,12 @@ str_38 str_38 \N ----------------------------------------------------------------------------------------------------------- test2 insert test2 select -2500000 -750000 -1750000 +500000 +100000 +400000 
----------------------------------------------------------------------------------------------------------- test2 select -2500000 -750000 -1750000 +500000 +100000 +400000 ----------------------------------------------------------------------------------------------------------- diff --git a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh index 3bb37719a3f..1d88757a5d6 100755 --- a/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh +++ b/tests/queries/0_stateless/02943_variant_type_with_different_local_and_global_order.sh @@ -29,10 +29,10 @@ function test1_select() function test2_insert() { echo "test2 insert" - $CH_CLIENT -q "insert into test select number, number::Variant(UInt64)::Variant(UInt64, Array(UInt64)) from numbers(1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" - $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)) as res from numbers(1000000, 1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" - $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64)) as res from numbers(2000000, 1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" - $CH_CLIENT -q "insert into test select number, if(number < 3500000, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)), if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64))) from numbers(3000000, 1000000) settings max_insert_block_size = 100000, min_insert_block_size_rows=100000" + $CH_CLIENT -q "insert into test select number, number::Variant(UInt64)::Variant(UInt64, Array(UInt64)) from numbers(200000) settings max_insert_block_size = 10000, min_insert_block_size_rows=10000" + $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)) as res from numbers(200000, 200000) settings max_insert_block_size = 10000, min_insert_block_size_rows=10000" + $CH_CLIENT -q "insert into test select number, if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64)) as res from numbers(400000, 200000) settings max_insert_block_size = 10000, min_insert_block_size_rows=10000" + $CH_CLIENT -q "insert into test select number, if(number < 3500000, if(number % 2, NULL, number)::Variant(UInt64)::Variant(UInt64, String, Array(UInt64)), if(number % 2, NULL, 'str_' || toString(number))::Variant(String)::Variant(UInt64, String, Array(UInt64))) from numbers(600000, 200000) settings max_insert_block_size = 10000, min_insert_block_size_rows=10000" } function test2_select() From a90a6e9a271515dec58e4d4f716bcd591f245c00 Mon Sep 17 00:00:00 2001 From: Kruglov Pavel <48961922+Avogar@users.noreply.github.com> Date: Mon, 11 Mar 2024 21:05:44 +0100 Subject: [PATCH 319/985] Revert "Don't allow to set max_parallel_replicas to 0 as it doesn't make sense" --- src/Client/ConnectionPoolWithFailover.cpp | 10 ---------- src/Client/HedgedConnectionsFactory.cpp | 6 +----- src/Client/HedgedConnectionsFactory.h | 2 +- src/Interpreters/InterpreterSelectQuery.cpp | 2 +- src/Planner/PlannerJoinTree.cpp | 4 ++-- .../03001_max_parallel_replicas_zero_value.reference | 
0 .../03001_max_parallel_replicas_zero_value.sql | 5 ----- 7 files changed, 5 insertions(+), 24 deletions(-) delete mode 100644 tests/queries/0_stateless/03001_max_parallel_replicas_zero_value.reference delete mode 100644 tests/queries/0_stateless/03001_max_parallel_replicas_zero_value.sql diff --git a/src/Client/ConnectionPoolWithFailover.cpp b/src/Client/ConnectionPoolWithFailover.cpp index ad8ed0067d8..492fd4ae9e2 100644 --- a/src/Client/ConnectionPoolWithFailover.cpp +++ b/src/Client/ConnectionPoolWithFailover.cpp @@ -21,7 +21,6 @@ namespace ErrorCodes { extern const int LOGICAL_ERROR; extern const int ALL_CONNECTION_TRIES_FAILED; - extern const int BAD_ARGUMENTS; } @@ -192,20 +191,11 @@ std::vector ConnectionPoolWithFailover::g max_entries = nested_pools.size(); } else if (pool_mode == PoolMode::GET_ONE) - { max_entries = 1; - } else if (pool_mode == PoolMode::GET_MANY) - { - if (settings.max_parallel_replicas == 0) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "The value of the setting max_parallel_replicas must be greater than 0"); - max_entries = settings.max_parallel_replicas; - } else - { throw DB::Exception(DB::ErrorCodes::LOGICAL_ERROR, "Unknown pool allocation mode"); - } if (!priority_func) priority_func = makeGetPriorityFunc(settings); diff --git a/src/Client/HedgedConnectionsFactory.cpp b/src/Client/HedgedConnectionsFactory.cpp index 703cc1f8821..f5b074a0257 100644 --- a/src/Client/HedgedConnectionsFactory.cpp +++ b/src/Client/HedgedConnectionsFactory.cpp @@ -19,7 +19,6 @@ namespace ErrorCodes extern const int ALL_CONNECTION_TRIES_FAILED; extern const int ALL_REPLICAS_ARE_STALE; extern const int LOGICAL_ERROR; - extern const int BAD_ARGUMENTS; } HedgedConnectionsFactory::HedgedConnectionsFactory( @@ -83,10 +82,7 @@ std::vector HedgedConnectionsFactory::getManyConnections(PoolMode } case PoolMode::GET_MANY: { - if (max_parallel_replicas == 0) - throw Exception(ErrorCodes::BAD_ARGUMENTS, "The value of the setting max_parallel_replicas must be greater than 0"); - - max_entries = std::min(max_parallel_replicas, shuffled_pools.size()); + max_entries = max_parallel_replicas; break; } } diff --git a/src/Client/HedgedConnectionsFactory.h b/src/Client/HedgedConnectionsFactory.h index dd600d58e1e..ce7b553acdd 100644 --- a/src/Client/HedgedConnectionsFactory.h +++ b/src/Client/HedgedConnectionsFactory.h @@ -158,7 +158,7 @@ private: /// checking the number of requested replicas that are still in process). 
size_t requested_connections_count = 0; - const size_t max_parallel_replicas = 1; + const size_t max_parallel_replicas = 0; const bool skip_unavailable_shards = 0; }; diff --git a/src/Interpreters/InterpreterSelectQuery.cpp b/src/Interpreters/InterpreterSelectQuery.cpp index e28d8366aa7..bcedba7346d 100644 --- a/src/Interpreters/InterpreterSelectQuery.cpp +++ b/src/Interpreters/InterpreterSelectQuery.cpp @@ -947,7 +947,7 @@ bool InterpreterSelectQuery::adjustParallelReplicasAfterAnalysis() if (number_of_replicas_to_use <= 1) { context->setSetting("allow_experimental_parallel_reading_from_replicas", Field(0)); - context->setSetting("max_parallel_replicas", UInt64{1}); + context->setSetting("max_parallel_replicas", UInt64{0}); LOG_DEBUG(log, "Disabling parallel replicas because there aren't enough rows to read"); return true; } diff --git a/src/Planner/PlannerJoinTree.cpp b/src/Planner/PlannerJoinTree.cpp index 0fe943e0bc7..7b3fb0c5c91 100644 --- a/src/Planner/PlannerJoinTree.cpp +++ b/src/Planner/PlannerJoinTree.cpp @@ -295,7 +295,7 @@ bool applyTrivialCountIfPossible( /// The query could use trivial count if it didn't use parallel replicas, so let's disable it query_context->setSetting("allow_experimental_parallel_reading_from_replicas", Field(0)); - query_context->setSetting("max_parallel_replicas", UInt64{1}); + query_context->setSetting("max_parallel_replicas", UInt64{0}); LOG_TRACE(getLogger("Planner"), "Disabling parallel replicas to be able to use a trivial count optimization"); } @@ -756,7 +756,7 @@ JoinTreeQueryPlan buildQueryPlanForTableExpression(QueryTreeNodePtr table_expres { planner_context->getMutableQueryContext()->setSetting( "allow_experimental_parallel_reading_from_replicas", Field(0)); - planner_context->getMutableQueryContext()->setSetting("max_parallel_replicas", UInt64{1}); + planner_context->getMutableQueryContext()->setSetting("max_parallel_replicas", UInt64{0}); LOG_DEBUG(getLogger("Planner"), "Disabling parallel replicas because there aren't enough rows to read"); } else if (number_of_replicas_to_use < settings.max_parallel_replicas) diff --git a/tests/queries/0_stateless/03001_max_parallel_replicas_zero_value.reference b/tests/queries/0_stateless/03001_max_parallel_replicas_zero_value.reference deleted file mode 100644 index e69de29bb2d..00000000000 diff --git a/tests/queries/0_stateless/03001_max_parallel_replicas_zero_value.sql b/tests/queries/0_stateless/03001_max_parallel_replicas_zero_value.sql deleted file mode 100644 index 611aa4777ba..00000000000 --- a/tests/queries/0_stateless/03001_max_parallel_replicas_zero_value.sql +++ /dev/null @@ -1,5 +0,0 @@ -drop table if exists test_d; -create table test_d engine=Distributed(test_cluster_two_shard_three_replicas_localhost, system, numbers); -select * from test_d limit 10 settings max_parallel_replicas = 0, prefer_localhost_replica = 0; --{serverError BAD_ARGUMENTS} -drop table test_d; - From 120a1fdb5f817b442bf659da243407fb7003eaa1 Mon Sep 17 00:00:00 2001 From: johnnymatthews <9611008+johnnymatthews@users.noreply.github.com> Date: Mon, 11 Mar 2024 17:24:33 -0300 Subject: [PATCH 320/985] Improves varPop docs. Adds varPopStable. 
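A minimal usage sketch of the two functions documented below (the table name and
values are illustrative only, not part of the docs): varPop(x) returns the
population variance of a single column, Σ((x - x̅)^2) / n, while varPopStable(x)
computes the same quantity with a slower but numerically stable algorithm.

```sql
-- Illustrative only: compare the fast and the numerically stable variants.
CREATE TABLE series (x Float64) ENGINE = Memory;
INSERT INTO series VALUES (10.5), (12.3), (9.8), (11.2), (10.7);
SELECT varPop(x), varPopStable(x) FROM series;
```
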
--- .../aggregate-functions/reference/varpop.md | 99 +++++++++++++++++-- 1 file changed, 91 insertions(+), 8 deletions(-) diff --git a/docs/en/sql-reference/aggregate-functions/reference/varpop.md b/docs/en/sql-reference/aggregate-functions/reference/varpop.md index 751688b0830..5f18bdc30f6 100644 --- a/docs/en/sql-reference/aggregate-functions/reference/varpop.md +++ b/docs/en/sql-reference/aggregate-functions/reference/varpop.md @@ -1,16 +1,99 @@ --- -slug: /en/sql-reference/aggregate-functions/reference/varpop +title: "varPop" +slug: "/en/sql-reference/aggregate-functions/reference/varpop" sidebar_position: 32 --- -# varPop(x) +This page covers the `varPop` and `varPopStable` functions available in ClickHouse. -Calculates the amount `Σ((x - x̅)^2) / n`, where `n` is the sample size and `x̅`is the average value of `x`. +## varPop -In other words, dispersion for a set of values. Returns `Float64`. +Calculates the population covariance between two data columns. The population covariance measures the degree to which two variables vary together. Calculates the amount `Σ((x - x̅)^2) / n`, where `n` is the sample size and `x̅`is the average value of `x`. -Alias: `VAR_POP`. +**Syntax** -:::note -This function uses a numerically unstable algorithm. If you need [numerical stability](https://en.wikipedia.org/wiki/Numerical_stability) in calculations, use the `varPopStable` function. It works slower but provides a lower computational error. -::: \ No newline at end of file +```sql +covarPop(x, y) +``` + +**Parameters** + +- `x`: The first data column. [Numeric](../../../native-protocol/columns.md) +- `y`: The second data column. [Numeric](../../../native-protocol/columns.md) + +**Returned value** + +Returns an integer of type `Float64`. + +**Implementation details** + +This function uses a numerically unstable algorithm. If you need numerical stability in calculations, use the slower but more stable [`varPopStable` function](#varPopStable). + +**Example** + +```sql +DROP TABLE IF EXISTS test_data; +CREATE TABLE test_data +( + x Int32, + y Int32 +) +ENGINE = Memory; + +INSERT INTO test_data VALUES (1, 2), (2, 3), (3, 5), (4, 6), (5, 8); + +SELECT + covarPop(x, y) AS covar_pop +FROM test_data; +``` + +```response +3 +``` + +## varPopStable + +Calculates population covariance between two data columns using a stable, numerically accurate method to calculate the variance. This function is designed to provide reliable results even with large datasets or values that might cause numerical instability in other implementations. + +**Syntax** + +```sql +covarPopStable(x, y) +``` + +**Parameters** + +- `x`: The first data column. [String literal](../syntax#syntax-string-literal) +- `y`: The second data column. [Expression](../syntax#syntax-expressions) + +**Returned value** + +Returns an integer of type `Float64`. + +**Implementation details** + +Unlike [`varPop()`](#varPop), this function uses a stable, numerically accurate algorithm to calculate the population variance to avoid issues like catastrophic cancellation or loss of precision. This function also handles `NaN` and `Inf` values correctly, excluding them from calculations. 
+ +**Example** + +Query: + +```sql +DROP TABLE IF EXISTS test_data; +CREATE TABLE test_data +( + x Int32, + y Int32 +) +ENGINE = Memory; + +INSERT INTO test_data VALUES (1, 2), (2, 9), (9, 5), (4, 6), (5, 8); + +SELECT + covarPopStable(x, y) AS covar_pop_stable +FROM test_data; +``` + +```response +0.5999999999999999 +``` From 281dc8d29deba2980e6b191edefa3b62114d38a7 Mon Sep 17 00:00:00 2001 From: johnnymatthews <9611008+johnnymatthews@users.noreply.github.com> Date: Mon, 11 Mar 2024 17:48:12 -0300 Subject: [PATCH 321/985] Improves varSamp docs. Adds varSampStable docs. --- .../aggregate-functions/reference/varsamp.md | 126 ++++++++++++++++-- 1 file changed, 118 insertions(+), 8 deletions(-) diff --git a/docs/en/sql-reference/aggregate-functions/reference/varsamp.md b/docs/en/sql-reference/aggregate-functions/reference/varsamp.md index 9b2b94936ec..e75cb075ff8 100644 --- a/docs/en/sql-reference/aggregate-functions/reference/varsamp.md +++ b/docs/en/sql-reference/aggregate-functions/reference/varsamp.md @@ -1,18 +1,128 @@ --- +title: "varSamp" slug: /en/sql-reference/aggregate-functions/reference/varsamp sidebar_position: 33 --- -# varSamp +This page contains information on the `varSamp` and `varSampStable` ClickHouse functions. -Calculates the amount `Σ((x - x̅)^2) / (n - 1)`, where `n` is the sample size and `x̅`is the average value of `x`. +## varSamp -It represents an unbiased estimate of the variance of a random variable if passed values from its sample. +Calculate the sample variance of a data set. -Returns `Float64`. When `n <= 1`, returns `+∞`. +**Syntax** -Alias: `VAR_SAMP`. +```sql +varSamp(expr) +``` -:::note -This function uses a numerically unstable algorithm. If you need [numerical stability](https://en.wikipedia.org/wiki/Numerical_stability) in calculations, use the `varSampStable` function. It works slower but provides a lower computational error. -::: +**Parameters** + +- `expr`: An expression representing the data set for which you want to calculate the sample variance. [Expression](../syntax#syntax-expressions) + +**Returned value** + +Returns a Float64 value representing the sample variance of the input data set. + +**Implementation details** + +The `varSamp()` function calculates the sample variance using the following formula: + +```plaintext +∑(x - mean(x))^2 / (n - 1) +``` + +Where: + +- `x` is each individual data point in the data set. +- `mean(x)` is the arithmetic mean of the data set. +- `n` is the number of data points in the data set. + +The function assumes that the input data set represents a sample from a larger population. If you want to calculate the variance of the entire population (when you have the complete data set), you should use the [`varPop()` function](./varpop#varpop) instead. + +This function uses a numerically unstable algorithm. If you need numerical stability in calculations, use the slower but more stable [`varSampStable` function](#varSampStable). + +**Example** + +Query: + +```sql +CREATE TABLE example_table +( + id UInt64, + value Float64 +) +ENGINE = MergeTree +ORDER BY id; + +INSERT INTO example_table VALUES (1, 10.5), (2, 12.3), (3, 9.8), (4, 11.2), (5, 10.7); + +SELECT varSamp(value) FROM example_table; +``` + +Response: + +```response +0.8650000000000091 +``` + +## varSampStable + +Calculate the sample variance of a data set using a numerically stable algorithm. 
+ +**Syntax** + +```sql +varSampStable(expr) +``` + +**Parameters** + +- `expr`: An expression representing the data set for which you want to calculate the sample variance. [Expression](../syntax#syntax-expressions) + +**Returned value** + +The `varSampStable()` function returns a Float64 value representing the sample variance of the input data set. + +**Implementation details** + +The `varSampStable()` function calculates the sample variance using the same formula as the [`varSamp()`](#varSamp function): + +```plaintext +∑(x - mean(x))^2 / (n - 1) +``` + +Where: +- `x` is each individual data point in the data set. +- `mean(x)` is the arithmetic mean of the data set. +- `n` is the number of data points in the data set. + +The difference between `varSampStable()` and `varSamp()` is that `varSampStable()` is designed to provide a more deterministic and stable result when dealing with floating-point arithmetic. It uses an algorithm that minimizes the accumulation of rounding errors, which can be particularly important when dealing with large data sets or data with a wide range of values. + +Like `varSamp()`, the `varSampStable()` function assumes that the input data set represents a sample from a larger population. If you want to calculate the variance of the entire population (when you have the complete data set), you should use the [`varPopStable()` function](./varpop#varpopstable) instead. + +**Example** + +Query: + +```sql +CREATE TABLE example_table +( + id UInt64, + value Float64 +) +ENGINE = MergeTree +ORDER BY id; + +INSERT INTO example_table VALUES (1, 10.5), (2, 12.3), (3, 9.8), (4, 11.2), (5, 10.7); + +SELECT varSampStable(value) FROM example_table; +``` + +Response: + +```response +0.865 +``` + +This query calculates the sample variance of the `value` column in the `example_table` using the `varSampStable()` function. The result shows that the sample variance of the values `[10.5, 12.3, 9.8, 11.2, 10.7]` is approximately 0.865, which may differ slightly from the result of `varSamp()` due to the more precise handling of floating-point arithmetic. 
From 563df9bdcb425810a0c2d3ecb11302e22039c048 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Ra=C3=BAl=20Mar=C3=ADn?= Date: Mon, 11 Mar 2024 22:49:18 +0100 Subject: [PATCH 322/985] Fix multiple bugs in groupArraySorted --- .../AggregateFunctionGroupArraySorted.cpp | 8 +++++--- .../0_stateless/03008_groupSortedArray_field.reference | 3 +++ .../queries/0_stateless/03008_groupSortedArray_field.sql | 6 ++++++ 3 files changed, 14 insertions(+), 3 deletions(-) create mode 100644 tests/queries/0_stateless/03008_groupSortedArray_field.reference create mode 100644 tests/queries/0_stateless/03008_groupSortedArray_field.sql diff --git a/src/AggregateFunctions/AggregateFunctionGroupArraySorted.cpp b/src/AggregateFunctions/AggregateFunctionGroupArraySorted.cpp index 0e9856cfab9..0692ff28f18 100644 --- a/src/AggregateFunctions/AggregateFunctionGroupArraySorted.cpp +++ b/src/AggregateFunctions/AggregateFunctionGroupArraySorted.cpp @@ -310,10 +310,12 @@ public: { for (Field & element : values) { - UInt8 is_null = 0; - readBinary(is_null, buf); - if (!is_null) + bool has_value = 0; + readBinary(has_value, buf); + if (has_value) serialization->deserializeBinary(element, buf, {}); + else + element = Field{}; } } else diff --git a/tests/queries/0_stateless/03008_groupSortedArray_field.reference b/tests/queries/0_stateless/03008_groupSortedArray_field.reference new file mode 100644 index 00000000000..a7f89ebcf58 --- /dev/null +++ b/tests/queries/0_stateless/03008_groupSortedArray_field.reference @@ -0,0 +1,3 @@ +0A01003C79A557B3C43400C4865AA84C3B4B01000650BC18F7DE0B00FAAF43E708213401008ED706EA0A9F13007228F915F5602C0100C692CA8FB81405003A6D357047EB1A01008416B7C3239EE3FF7BE9483CDC61DC01003E133A7C081AF5FFC1ECC583F7E5EA01000000000000000000000000000000000100C4865AA84C3BCBFF3B79A557B3C4B4010024C46EF500F1ECFFDB3B910AFF0ED301005E2FC14EBAEAE5FFA1D03EB14515DA +070109000000010600000001080000000103000000010500000001040000000107000000 AggregateFunction(groupArraySorted(10), Nullable(Decimal(3, 0))) +[3,4,5,6,7,8,9] diff --git a/tests/queries/0_stateless/03008_groupSortedArray_field.sql b/tests/queries/0_stateless/03008_groupSortedArray_field.sql new file mode 100644 index 00000000000..6d2aea641a5 --- /dev/null +++ b/tests/queries/0_stateless/03008_groupSortedArray_field.sql @@ -0,0 +1,6 @@ +-- https://github.com/ClickHouse/ClickHouse/issues/61186 +SELECT hex(CAST(unhex('0A01003C79A557B3C43400C4865AA84C3B4B01000650BC18F7DE0B00FAAF43E708213401008ED706EA0A9F13007228F915F5602C0100C692CA8FB81405003A6D357047EB1A01008416B7C3239EE3FF7BE9483CDC61DC01003E133A7C081AF5FFC1ECC583F7E5EA01000000000000000000000000000000000100C4865AA84C3BCBFF3B79A557B3C4B4010024C46EF500F1ECFFDB3B910AFF0ED301005E2FC14EBAEAE5FFA1D03EB14515DA'), + 'AggregateFunction(groupArraySorted(10), Decimal(38, 38))')); + +Select hex(groupArraySortedState(10)((number < 3 ? 
NULL : number)::Nullable(Decimal(3))) as t), toTypeName(t) from numbers(10); +Select finalizeAggregation(unhex('070109000000010600000001080000000103000000010500000001040000000107000000')::AggregateFunction(groupArraySorted(10), Nullable(Decimal(3, 0)))); From 1b04cc0b4da6d32fd4741ea953dfed060f846d0b Mon Sep 17 00:00:00 2001 From: Alexey Milovidov Date: Tue, 12 Mar 2024 03:56:10 +0100 Subject: [PATCH 323/985] Fix strange log message --- src/Loggers/Loggers.cpp | 3 +++ 1 file changed, 3 insertions(+) diff --git a/src/Loggers/Loggers.cpp b/src/Loggers/Loggers.cpp index 1d17585cc96..cc6e4691737 100644 --- a/src/Loggers/Loggers.cpp +++ b/src/Loggers/Loggers.cpp @@ -304,6 +304,9 @@ void Loggers::buildLoggers(Poco::Util::AbstractConfiguration & config, Poco::Log log_settings.turn_off_logger = DB::TextLog::shouldTurnOffLogger(); + log_settings.database = config.getString("text_log.database", "system"); + log_settings.table = config.getString("text_log.table", "text_log"); + split->addTextLog(DB::TextLog::getLogQueue(log_settings), text_log_level); } #endif From 29fce4143d1f177efdf1864d41429cfadea22ff1 Mon Sep 17 00:00:00 2001 From: unashi Date: Tue, 12 Mar 2024 12:07:24 +0800 Subject: [PATCH 324/985] [fix] log level from fatal->error when hardlink and copy both fail --- src/Storages/MergeTree/MergeTreeData.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index c76ffeee874..97968f1b9c1 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -7174,7 +7174,7 @@ std::pair MergeTreeData::cloneAn } } if (!copy_successful) - LOG_FATAL(&Poco::Logger::get("MergeTreeData"), "Hard link fail, clone fail"); + LOG_ERROR(&Poco::Logger::get("MergeTreeData"), "Hard link fail, clone fail"); } From c628eaca8ba19584fe36067dee8e6ec3e8f5cc4b Mon Sep 17 00:00:00 2001 From: Zhuo Qiu Date: Tue, 26 Dec 2023 14:13:07 +0800 Subject: [PATCH 325/985] Consider deleted rows when selecting parts to merge --- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 90 +++++++++++++++++++ src/Storages/MergeTree/IMergeTreeDataPart.h | 13 +++ .../MergeTree/MergeFromLogEntryTask.cpp | 2 +- src/Storages/MergeTree/MergeTreeData.cpp | 1 + .../MergeTree/MergeTreeDataMergerMutator.cpp | 11 ++- .../MergeTree/MergeTreeDataMergerMutator.h | 2 +- .../MergeTree/MergeTreeDataWriter.cpp | 1 + src/Storages/MergeTree/MergeTreeSettings.h | 2 + .../MergeTree/MergedBlockOutputStream.cpp | 5 ++ .../MergeTree/MutateFromLogEntryTask.cpp | 2 +- src/Storages/MergeTree/MutateTask.cpp | 54 +++++++++++ .../MergeTree/ReplicatedMergeTreeQueue.cpp | 5 +- src/Storages/StorageMergeTree.cpp | 4 +- .../03001_consider_lwd_when_merge.reference | 3 + .../03001_consider_lwd_when_merge.sql | 23 +++++ 15 files changed, 208 insertions(+), 10 deletions(-) create mode 100644 tests/queries/0_stateless/03001_consider_lwd_when_merge.reference create mode 100644 tests/queries/0_stateless/03001_consider_lwd_when_merge.sql diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index 3fea6d04944..c099512d636 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -609,6 +609,15 @@ UInt64 IMergeTreeDataPart::getMarksCount() const return index_granularity.getMarksCount(); } +UInt64 IMergeTreeDataPart::getExistingBytesOnDisk() const +{ + if (storage.getSettings()->exclude_deleted_rows_for_part_size_in_merge && 
supportLightweightDeleteMutate() && hasLightweightDelete() + && existing_rows_count.has_value() && existing_rows_count.value() < rows_count && rows_count > 0) + return bytes_on_disk * existing_rows_count.value() / rows_count; + else + return bytes_on_disk; +} + size_t IMergeTreeDataPart::getFileSizeOrZero(const String & file_name) const { auto checksum = checksums.files.find(file_name); @@ -691,6 +700,7 @@ void IMergeTreeDataPart::loadColumnsChecksumsIndexes(bool require_columns_checks calculateColumnsAndSecondaryIndicesSizesOnDisk(); loadRowsCount(); /// Must be called after loadIndexGranularity() as it uses the value of `index_granularity`. + loadExistingRowsCount(); /// Must be called after loadRowsCount() as it uses the value of `rows_count`. loadPartitionAndMinMaxIndex(); if (!parent_part) { @@ -1313,6 +1323,86 @@ void IMergeTreeDataPart::loadRowsCount() } } +void IMergeTreeDataPart::loadExistingRowsCount() +{ + if (existing_rows_count.has_value()) + return; + + if (!rows_count || !storage.getSettings()->load_existing_rows_count_for_old_parts || !supportLightweightDeleteMutate() + || !hasLightweightDelete()) + existing_rows_count = rows_count; + else + existing_rows_count = readExistingRowsCount(); +} + +UInt64 IMergeTreeDataPart::readExistingRowsCount() +{ + const size_t total_mark = getMarksCount(); + if (!total_mark) + return rows_count; + + NamesAndTypesList cols; + cols.push_back(LightweightDeleteDescription::FILTER_COLUMN); + + StorageMetadataPtr metadata_ptr = storage.getInMemoryMetadataPtr(); + StorageSnapshotPtr storage_snapshot_ptr = std::make_shared(storage, metadata_ptr); + + MergeTreeReaderPtr reader = getReader( + cols, + storage_snapshot_ptr, + MarkRanges{MarkRange(0, total_mark)}, + nullptr, + storage.getContext()->getMarkCache().get(), + std::make_shared(), + MergeTreeReaderSettings{}, + ValueSizeMap{}, + ReadBufferFromFileBase::ProfileCallback{}); + + if (!reader) + { + LOG_WARNING(storage.log, "Create reader failed while reading existing rows count"); + return rows_count; + } + + size_t current_mark = 0; + bool continue_reading = false; + size_t current_row = 0; + size_t existing_count = 0; + + while (current_row < rows_count) + { + size_t rows_to_read = index_granularity.getMarkRows(current_mark); + continue_reading = (current_mark != 0); + + Columns result; + result.resize(1); + + size_t rows_read = reader->readRows(current_mark, total_mark, continue_reading, rows_to_read, result); + if (!rows_read) + { + LOG_WARNING(storage.log, "Part {} has lightweight delete, but _row_exists column not found", name); + return rows_count; + } + + current_row += rows_read; + current_mark += (rows_to_read == rows_read); + + const ColumnUInt8 * row_exists_col = typeid_cast(result[0].get()); + if (!row_exists_col) + { + LOG_WARNING(storage.log, "Part {} _row_exists column type is not UInt8", name); + return rows_count; + } + + for (UInt8 row_exists : row_exists_col->getData()) + if (row_exists) + existing_count++; + } + + LOG_DEBUG(storage.log, "Part {} existing_rows_count = {}", name, existing_count); + return existing_count; +} + void IMergeTreeDataPart::appendFilesOfRowsCount(Strings & files) { files.push_back("count.txt"); diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.h b/src/Storages/MergeTree/IMergeTreeDataPart.h index aaae64a5970..8bd32e777bc 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.h +++ b/src/Storages/MergeTree/IMergeTreeDataPart.h @@ -231,6 +231,9 @@ public: size_t rows_count = 0; + /// Existing rows count (excluding lightweight deleted rows) + 
std::optional existing_rows_count; + time_t modification_time = 0; /// When the part is removed from the working set. Changes once. mutable std::atomic remove_time { std::numeric_limits::max() }; @@ -373,6 +376,10 @@ public: void setBytesOnDisk(UInt64 bytes_on_disk_) { bytes_on_disk = bytes_on_disk_; } void setBytesUncompressedOnDisk(UInt64 bytes_uncompressed_on_disk_) { bytes_uncompressed_on_disk = bytes_uncompressed_on_disk_; } + /// Returns estimated size of existing rows if setting exclude_deleted_rows_for_part_size_in_merge is true + /// Otherwise returns bytes_on_disk + UInt64 getExistingBytesOnDisk() const; + size_t getFileSizeOrZero(const String & file_name) const; auto getFilesChecksums() const { return checksums.files; } @@ -499,6 +506,9 @@ public: /// True if here is lightweight deleted mask file in part. bool hasLightweightDelete() const; + /// Read existing rows count from _row_exists column + UInt64 readExistingRowsCount(); + void writeChecksums(const MergeTreeDataPartChecksums & checksums_, const WriteSettings & settings); /// Checks the consistency of this data part. @@ -664,6 +674,9 @@ private: /// For the older format version calculates rows count from the size of a column with a fixed size. void loadRowsCount(); + /// Load existing rows count from _row_exists column if load_existing_rows_count_for_old_parts is true. + void loadExistingRowsCount(); + static void appendFilesOfRowsCount(Strings & files); /// Loads ttl infos in json format from file ttl.txt. If file doesn't exists assigns ttl infos with all zeros diff --git a/src/Storages/MergeTree/MergeFromLogEntryTask.cpp b/src/Storages/MergeTree/MergeFromLogEntryTask.cpp index ae6e398026d..5ef004ec019 100644 --- a/src/Storages/MergeTree/MergeFromLogEntryTask.cpp +++ b/src/Storages/MergeTree/MergeFromLogEntryTask.cpp @@ -174,7 +174,7 @@ ReplicatedMergeMutateTaskBase::PrepareResult MergeFromLogEntryTask::prepare() } /// Start to make the main work - size_t estimated_space_for_merge = MergeTreeDataMergerMutator::estimateNeededDiskSpace(parts); + size_t estimated_space_for_merge = MergeTreeDataMergerMutator::estimateNeededDiskSpace(parts, true); /// Can throw an exception while reserving space. 
IMergeTreeDataPart::TTLInfos ttl_infos; diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index d56cf761cf4..5e05f75c1c5 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -8261,6 +8261,7 @@ std::pair MergeTreeData::createE new_data_part->setColumns(columns, {}, metadata_snapshot->getMetadataVersion()); new_data_part->rows_count = block.rows(); + new_data_part->existing_rows_count = block.rows(); new_data_part->partition = partition; diff --git a/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp b/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp index 1bf1d4a3c29..90144a8cc8f 100644 --- a/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp +++ b/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp @@ -405,7 +405,7 @@ MergeTreeDataMergerMutator::MergeSelectingInfo MergeTreeDataMergerMutator::getPo } IMergeSelector::Part part_info; - part_info.size = part->getBytesOnDisk(); + part_info.size = part->getExistingBytesOnDisk(); part_info.age = res.current_time - part->modification_time; part_info.level = part->info.level; part_info.data = ∂ @@ -611,7 +611,7 @@ SelectPartsDecision MergeTreeDataMergerMutator::selectAllPartsToMergeWithinParti return SelectPartsDecision::CANNOT_SELECT; } - sum_bytes += (*it)->getBytesOnDisk(); + sum_bytes += (*it)->getExistingBytesOnDisk(); prev_it = it; ++it; @@ -793,7 +793,7 @@ MergeTreeData::DataPartPtr MergeTreeDataMergerMutator::renameMergedTemporaryPart } -size_t MergeTreeDataMergerMutator::estimateNeededDiskSpace(const MergeTreeData::DataPartsVector & source_parts) +size_t MergeTreeDataMergerMutator::estimateNeededDiskSpace(const MergeTreeData::DataPartsVector & source_parts, const bool & is_merge) { size_t res = 0; time_t current_time = std::time(nullptr); @@ -804,7 +804,10 @@ size_t MergeTreeDataMergerMutator::estimateNeededDiskSpace(const MergeTreeData:: if (part_max_ttl && part_max_ttl <= current_time) continue; - res += part->getBytesOnDisk(); + if (is_merge) + res += part->getExistingBytesOnDisk(); + else + res += part->getBytesOnDisk(); } return static_cast(res * DISK_USAGE_COEFFICIENT_TO_RESERVE); diff --git a/src/Storages/MergeTree/MergeTreeDataMergerMutator.h b/src/Storages/MergeTree/MergeTreeDataMergerMutator.h index f3a3f51b6c3..731c5e1d176 100644 --- a/src/Storages/MergeTree/MergeTreeDataMergerMutator.h +++ b/src/Storages/MergeTree/MergeTreeDataMergerMutator.h @@ -193,7 +193,7 @@ public: /// The approximate amount of disk space needed for merge or mutation. With a surplus. - static size_t estimateNeededDiskSpace(const MergeTreeData::DataPartsVector & source_parts); + static size_t estimateNeededDiskSpace(const MergeTreeData::DataPartsVector & source_parts, const bool & is_merge); private: /** Select all parts belonging to the same partition. 
diff --git a/src/Storages/MergeTree/MergeTreeDataWriter.cpp b/src/Storages/MergeTree/MergeTreeDataWriter.cpp index fdac16ae19a..2ba74e44b40 100644 --- a/src/Storages/MergeTree/MergeTreeDataWriter.cpp +++ b/src/Storages/MergeTree/MergeTreeDataWriter.cpp @@ -537,6 +537,7 @@ MergeTreeDataWriter::TemporaryPart MergeTreeDataWriter::writeTempPartImpl( new_data_part->setColumns(columns, infos, metadata_snapshot->getMetadataVersion()); new_data_part->rows_count = block.rows(); + new_data_part->existing_rows_count = block.rows(); new_data_part->partition = std::move(partition); new_data_part->minmax_idx = std::move(minmax_idx); new_data_part->is_temp = true; diff --git a/src/Storages/MergeTree/MergeTreeSettings.h b/src/Storages/MergeTree/MergeTreeSettings.h index 925dc973dc3..ea54f61b4b6 100644 --- a/src/Storages/MergeTree/MergeTreeSettings.h +++ b/src/Storages/MergeTree/MergeTreeSettings.h @@ -42,6 +42,7 @@ struct Settings; M(UInt64, compact_parts_max_bytes_to_buffer, 128 * 1024 * 1024, "Only available in ClickHouse Cloud", 0) \ M(UInt64, compact_parts_max_granules_to_buffer, 128, "Only available in ClickHouse Cloud", 0) \ M(UInt64, compact_parts_merge_max_bytes_to_prefetch_part, 16 * 1024 * 1024, "Only available in ClickHouse Cloud", 0) \ + M(Bool, load_existing_rows_count_for_old_parts, false, "Whether to load existing_rows_count for existing parts. If false, existing_rows_count will be equal to rows_count for existing parts.", 0) \ \ /** Merge settings. */ \ M(UInt64, merge_max_block_size, 8192, "How many rows in blocks should be formed for merge operations. By default has the same value as `index_granularity`.", 0) \ @@ -79,6 +80,7 @@ struct Settings; M(UInt64, number_of_mutations_to_throw, 1000, "If table has at least that many unfinished mutations, throw 'Too many mutations' exception. Disabled if set to 0", 0) \ M(UInt64, min_delay_to_mutate_ms, 10, "Min delay of mutating MergeTree table in milliseconds, if there are a lot of unfinished mutations", 0) \ M(UInt64, max_delay_to_mutate_ms, 1000, "Max delay of mutating MergeTree table in milliseconds, if there are a lot of unfinished mutations", 0) \ + M(Bool, exclude_deleted_rows_for_part_size_in_merge, false, "Use an estimated source part size (excluding lightweight deleted rows) when selecting parts to merge", 0) \ \ /** Inserts settings. */ \ M(UInt64, parts_to_delay_insert, 1000, "If table contains at least that many active parts in single partition, artificially slow down insert into table. 
Disabled if set to 0", 0) \ diff --git a/src/Storages/MergeTree/MergedBlockOutputStream.cpp b/src/Storages/MergeTree/MergedBlockOutputStream.cpp index f2fe2e0f255..d8555d69788 100644 --- a/src/Storages/MergeTree/MergedBlockOutputStream.cpp +++ b/src/Storages/MergeTree/MergedBlockOutputStream.cpp @@ -188,6 +188,11 @@ MergedBlockOutputStream::Finalizer MergedBlockOutputStream::finalizePartAsync( new_part->index_granularity = writer->getIndexGranularity(); new_part->calculateColumnsAndSecondaryIndicesSizesOnDisk(); + /// In mutation, existing_rows_count is already calculated in PartMergerWriter + /// In merge situation, lightweight deleted rows was physically deleted, existing_rows_count equals rows_count + if (!new_part->existing_rows_count.has_value()) + new_part->existing_rows_count = rows_count; + if (default_codec != nullptr) new_part->default_codec = default_codec; diff --git a/src/Storages/MergeTree/MutateFromLogEntryTask.cpp b/src/Storages/MergeTree/MutateFromLogEntryTask.cpp index a9ff687fe4d..620b0e34c6a 100644 --- a/src/Storages/MergeTree/MutateFromLogEntryTask.cpp +++ b/src/Storages/MergeTree/MutateFromLogEntryTask.cpp @@ -49,7 +49,7 @@ ReplicatedMergeMutateTaskBase::PrepareResult MutateFromLogEntryTask::prepare() } /// TODO - some better heuristic? - size_t estimated_space_for_result = MergeTreeDataMergerMutator::estimateNeededDiskSpace({source_part}); + size_t estimated_space_for_result = MergeTreeDataMergerMutator::estimateNeededDiskSpace({source_part}, false); if (entry.create_time + storage_settings_ptr->prefer_fetch_merged_part_time_threshold.totalSeconds() <= time(nullptr) && estimated_space_for_result >= storage_settings_ptr->prefer_fetch_merged_part_size_threshold) diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index 150cc27c369..3d31d2f05db 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -60,6 +60,26 @@ static bool checkOperationIsNotCanceled(ActionBlocker & merges_blocker, MergeLis return true; } +static UInt64 getExistingRowsCount(const Block & block) +{ + auto column = block.getByName(LightweightDeleteDescription::FILTER_COLUMN.name).column; + const ColumnUInt8 * row_exists_col = typeid_cast(column.get()); + + if (!row_exists_col) + { + LOG_WARNING(&Poco::Logger::get("MutationHelpers::getExistingRowsCount"), "_row_exists column type is not UInt8"); + return block.rows(); + } + + UInt64 existing_count = 0; + + for (UInt8 row_exists : row_exists_col->getData()) + if (row_exists) + existing_count++; + + return existing_count; +} + /** Split mutation commands into two parts: * First part should be executed by mutations interpreter. * Other is just simple drop/renames, so they can be executed without interpreter. @@ -997,6 +1017,9 @@ struct MutationContext bool need_prefix = true; scope_guard temporary_directory_lock; + + /// Whether this mutation contains lightweight delete + bool has_lightweight_delete; }; using MutationContextPtr = std::shared_ptr; @@ -1191,6 +1214,7 @@ public: } case State::SUCCESS: { + finalize(); return false; } } @@ -1226,6 +1250,11 @@ private: const ProjectionsDescription & projections; ExecutableTaskPtr merge_projection_parts_task_ptr; + + /// Existing rows count calculated during part writing. 
+ /// It is initialized in prepare(), calculated in mutateOriginalPartAndPrepareProjections() + /// and set to new_data_part in finalize() + size_t existing_rows_count; }; @@ -1238,6 +1267,8 @@ void PartMergerWriter::prepare() // We split the materialization into multiple stages similar to the process of INSERT SELECT query. projection_squashes.emplace_back(settings.min_insert_block_size_rows, settings.min_insert_block_size_bytes); } + + existing_rows_count = 0; } @@ -1251,6 +1282,9 @@ bool PartMergerWriter::mutateOriginalPartAndPrepareProjections() ctx->out->write(cur_block); + if (ctx->has_lightweight_delete) + existing_rows_count += MutationHelpers::getExistingRowsCount(cur_block); + for (size_t i = 0, size = ctx->projections_to_build.size(); i < size; ++i) { const auto & projection = *ctx->projections_to_build[i]; @@ -1340,6 +1374,12 @@ bool PartMergerWriter::iterateThroughAllProjections() return true; } +void PartMergerWriter::finalize() +{ + if (ctx->has_lightweight_delete) + ctx->new_data_part->existing_rows_count = existing_rows_count; +} + class MutateAllPartColumnsTask : public IExecutableTask { public: @@ -2185,6 +2225,20 @@ bool MutateTask::prepare() if (ctx->mutating_pipeline_builder.initialized()) ctx->execute_ttl_type = MutationHelpers::shouldExecuteTTL(ctx->metadata_snapshot, ctx->interpreter->getColumnDependencies()); + if (ctx->updated_header.has(LightweightDeleteDescription::FILTER_COLUMN.name)) + { + /// This mutation contains lightweight delete, reset existing_rows_count of new data part to 0 + /// It will be updated while writing _row_exists column + ctx->has_lightweight_delete = true; + } + else + { + ctx->has_lightweight_delete = false; + + /// This mutation does not contains lightweight delete, copy existing_rows_count from source part + ctx->new_data_part->existing_rows_count = ctx->source_part->existing_rows_count.value_or(ctx->source_part->rows_count); + } + /// All columns from part are changed and may be some more that were missing before in part /// TODO We can materialize compact part without copying data if (!isWidePart(ctx->source_part) || !isFullPartStorage(ctx->source_part->getDataPartStorage()) diff --git a/src/Storages/MergeTree/ReplicatedMergeTreeQueue.cpp b/src/Storages/MergeTree/ReplicatedMergeTreeQueue.cpp index 858eae4afd9..42f564f40da 100644 --- a/src/Storages/MergeTree/ReplicatedMergeTreeQueue.cpp +++ b/src/Storages/MergeTree/ReplicatedMergeTreeQueue.cpp @@ -1350,7 +1350,10 @@ bool ReplicatedMergeTreeQueue::shouldExecuteLogEntry( auto part = data.getPartIfExists(name, {MergeTreeDataPartState::PreActive, MergeTreeDataPartState::Active, MergeTreeDataPartState::Outdated}); if (part) { - sum_parts_size_in_bytes += part->getBytesOnDisk(); + if (entry.type == LogEntry::MERGE_PARTS) + sum_parts_size_in_bytes += part->getExistingBytesOnDisk(); + else + sum_parts_size_in_bytes += part->getBytesOnDisk(); if (entry.type == LogEntry::MUTATE_PART && !storage.mutation_backoff_policy.partCanBeMutated(part->name)) { diff --git a/src/Storages/StorageMergeTree.cpp b/src/Storages/StorageMergeTree.cpp index 663e7f435b7..c816a6f0dce 100644 --- a/src/Storages/StorageMergeTree.cpp +++ b/src/Storages/StorageMergeTree.cpp @@ -1113,7 +1113,7 @@ MergeMutateSelectedEntryPtr StorageMergeTree::selectPartsToMerge( if (isTTLMergeType(future_part->merge_type)) getContext()->getMergeList().bookMergeWithTTL(); - merging_tagger = std::make_unique(future_part, MergeTreeDataMergerMutator::estimateNeededDiskSpace(future_part->parts), *this, metadata_snapshot, false); + merging_tagger 
= std::make_unique(future_part, MergeTreeDataMergerMutator::estimateNeededDiskSpace(future_part->parts, true), *this, metadata_snapshot, false); return std::make_shared(future_part, std::move(merging_tagger), std::make_shared()); } @@ -1336,7 +1336,7 @@ MergeMutateSelectedEntryPtr StorageMergeTree::selectPartsToMutate( future_part->name = part->getNewName(new_part_info); future_part->part_format = part->getFormat(); - tagger = std::make_unique(future_part, MergeTreeDataMergerMutator::estimateNeededDiskSpace({part}), *this, metadata_snapshot, true); + tagger = std::make_unique(future_part, MergeTreeDataMergerMutator::estimateNeededDiskSpace({part}, false), *this, metadata_snapshot, true); return std::make_shared(future_part, std::move(tagger), commands, txn); } } diff --git a/tests/queries/0_stateless/03001_consider_lwd_when_merge.reference b/tests/queries/0_stateless/03001_consider_lwd_when_merge.reference new file mode 100644 index 00000000000..19920de3d3c --- /dev/null +++ b/tests/queries/0_stateless/03001_consider_lwd_when_merge.reference @@ -0,0 +1,3 @@ +2 +2 +1 diff --git a/tests/queries/0_stateless/03001_consider_lwd_when_merge.sql b/tests/queries/0_stateless/03001_consider_lwd_when_merge.sql new file mode 100644 index 00000000000..a65e8877020 --- /dev/null +++ b/tests/queries/0_stateless/03001_consider_lwd_when_merge.sql @@ -0,0 +1,23 @@ +DROP TABLE IF EXISTS lwd_merge; + +CREATE TABLE lwd_merge (id UInt64 CODEC(NONE)) + ENGINE = MergeTree ORDER BY id +SETTINGS max_bytes_to_merge_at_max_space_in_pool = 80000, exclude_deleted_rows_for_part_size_in_merge = 0; + +INSERT INTO lwd_merge SELECT number FROM numbers(10000); +INSERT INTO lwd_merge SELECT number FROM numbers(10000, 10000); + +OPTIMIZE TABLE lwd_merge; +SELECT count() FROM system.parts WHERE database = currentDatabase() AND table = 'lwd_merge' AND active = 1; + +DELETE FROM lwd_merge WHERE id % 10 > 0; + +OPTIMIZE TABLE lwd_merge; +SELECT count() FROM system.parts WHERE database = currentDatabase() AND table = 'lwd_merge' AND active = 1; + +ALTER TABLE lwd_merge MODIFY SETTING exclude_deleted_rows_for_part_size_in_merge = 1; + +OPTIMIZE TABLE lwd_merge; +SELECT count() FROM system.parts WHERE database = currentDatabase() AND table = 'lwd_merge' AND active = 1; + +DROP TABLE IF EXISTS lwd_merge; From 4ad8141a162b3b7735e2f08c069e98b9c2ba2382 Mon Sep 17 00:00:00 2001 From: Zhuo Qiu Date: Wed, 28 Feb 2024 19:54:21 -0600 Subject: [PATCH 326/985] Maintain compatibility of estimateNeededDiskSpace() Co-authored-by: Yakov Olkhovskiy <99031427+yakov-olkhovskiy@users.noreply.github.com> --- src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp | 4 ++-- src/Storages/MergeTree/MergeTreeDataMergerMutator.h | 2 +- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp b/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp index 90144a8cc8f..53d49b51e8f 100644 --- a/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp +++ b/src/Storages/MergeTree/MergeTreeDataMergerMutator.cpp @@ -793,7 +793,7 @@ MergeTreeData::DataPartPtr MergeTreeDataMergerMutator::renameMergedTemporaryPart } -size_t MergeTreeDataMergerMutator::estimateNeededDiskSpace(const MergeTreeData::DataPartsVector & source_parts, const bool & is_merge) +size_t MergeTreeDataMergerMutator::estimateNeededDiskSpace(const MergeTreeData::DataPartsVector & source_parts, const bool & account_for_deleted) { size_t res = 0; time_t current_time = std::time(nullptr); @@ -804,7 +804,7 @@ size_t 
MergeTreeDataMergerMutator::estimateNeededDiskSpace(const MergeTreeData:: if (part_max_ttl && part_max_ttl <= current_time) continue; - if (is_merge) + if (account_for_deleted) res += part->getExistingBytesOnDisk(); else res += part->getBytesOnDisk(); diff --git a/src/Storages/MergeTree/MergeTreeDataMergerMutator.h b/src/Storages/MergeTree/MergeTreeDataMergerMutator.h index 731c5e1d176..669ee040af3 100644 --- a/src/Storages/MergeTree/MergeTreeDataMergerMutator.h +++ b/src/Storages/MergeTree/MergeTreeDataMergerMutator.h @@ -193,7 +193,7 @@ public: /// The approximate amount of disk space needed for merge or mutation. With a surplus. - static size_t estimateNeededDiskSpace(const MergeTreeData::DataPartsVector & source_parts, const bool & is_merge); + static size_t estimateNeededDiskSpace(const MergeTreeData::DataPartsVector & source_parts, const bool & account_for_deleted = false); private: /** Select all parts belonging to the same partition. From 10c7ea7a29d8426fcf4d0ca09c778cdd3e56fbbd Mon Sep 17 00:00:00 2001 From: unashi Date: Tue, 12 Mar 2024 14:32:07 +0800 Subject: [PATCH 327/985] [debug] fast test again --- src/Storages/StorageMergeTree.cpp | 1 - 1 file changed, 1 deletion(-) diff --git a/src/Storages/StorageMergeTree.cpp b/src/Storages/StorageMergeTree.cpp index 055a48ad998..928ee094583 100644 --- a/src/Storages/StorageMergeTree.cpp +++ b/src/Storages/StorageMergeTree.cpp @@ -2083,7 +2083,6 @@ void StorageMergeTree::replacePartitionFrom(const StoragePtr & source_table, con MergeTreePartInfo dst_part_info(partition_id, temp_index, temp_index, src_part->info.level); IDataPartStorage::ClonePartParams clone_params{.txn = local_context->getCurrentTransaction()}; - bool on_same_disk = false; for (const DiskPtr & disk : this->getStoragePolicy()->getDisks()) if (disk->getName() == src_part->getDataPartStorage().getDiskName()) From 05969a39f390445c8d0df43b7077e0eb81db3538 Mon Sep 17 00:00:00 2001 From: Zhuo Qiu Date: Tue, 12 Mar 2024 14:45:25 +0800 Subject: [PATCH 328/985] resolve conflicts --- src/Storages/MergeTree/IMergeTreeDataPart.cpp | 5 +++-- src/Storages/MergeTree/MutateTask.cpp | 4 ++-- 2 files changed, 5 insertions(+), 4 deletions(-) diff --git a/src/Storages/MergeTree/IMergeTreeDataPart.cpp b/src/Storages/MergeTree/IMergeTreeDataPart.cpp index c099512d636..5fede923252 100644 --- a/src/Storages/MergeTree/IMergeTreeDataPart.cpp +++ b/src/Storages/MergeTree/IMergeTreeDataPart.cpp @@ -1342,7 +1342,7 @@ UInt64 IMergeTreeDataPart::readExistingRowsCount() return rows_count; NamesAndTypesList cols; - cols.push_back(LightweightDeleteDescription::FILTER_COLUMN); + cols.emplace_back(RowExistsColumn::name, RowExistsColumn::type); StorageMetadataPtr metadata_ptr = storage.getInMemoryMetadataPtr(); StorageSnapshotPtr storage_snapshot_ptr = std::make_shared(storage, metadata_ptr); @@ -1351,7 +1351,8 @@ UInt64 IMergeTreeDataPart::readExistingRowsCount() cols, storage_snapshot_ptr, MarkRanges{MarkRange(0, total_mark)}, - nullptr, + /*virtual_fields=*/ {}, + /*uncompressed_cache=*/{}, storage.getContext()->getMarkCache().get(), std::make_shared(), MergeTreeReaderSettings{}, diff --git a/src/Storages/MergeTree/MutateTask.cpp b/src/Storages/MergeTree/MutateTask.cpp index 3d31d2f05db..4d1e60f450e 100644 --- a/src/Storages/MergeTree/MutateTask.cpp +++ b/src/Storages/MergeTree/MutateTask.cpp @@ -62,7 +62,7 @@ static bool checkOperationIsNotCanceled(ActionBlocker & merges_blocker, MergeLis static UInt64 getExistingRowsCount(const Block & block) { - auto column = 
block.getByName(LightweightDeleteDescription::FILTER_COLUMN.name).column; + auto column = block.getByName(RowExistsColumn::name).column; const ColumnUInt8 * row_exists_col = typeid_cast(column.get()); if (!row_exists_col) @@ -2225,7 +2225,7 @@ bool MutateTask::prepare() if (ctx->mutating_pipeline_builder.initialized()) ctx->execute_ttl_type = MutationHelpers::shouldExecuteTTL(ctx->metadata_snapshot, ctx->interpreter->getColumnDependencies()); - if (ctx->updated_header.has(LightweightDeleteDescription::FILTER_COLUMN.name)) + if (ctx->updated_header.has(RowExistsColumn::name)) { /// This mutation contains lightweight delete, reset existing_rows_count of new data part to 0 /// It will be updated while writing _row_exists column From c1b94b2170acbf72d066928fd168c18dc571d505 Mon Sep 17 00:00:00 2001 From: unashi Date: Tue, 12 Mar 2024 15:33:43 +0800 Subject: [PATCH 329/985] [debug] fast test again again --- src/Storages/MergeTree/MergeTreeData.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/Storages/MergeTree/MergeTreeData.cpp b/src/Storages/MergeTree/MergeTreeData.cpp index 97968f1b9c1..7fc504d71f1 100644 --- a/src/Storages/MergeTree/MergeTreeData.cpp +++ b/src/Storages/MergeTree/MergeTreeData.cpp @@ -7174,7 +7174,7 @@ std::pair MergeTreeData::cloneAn } } if (!copy_successful) - LOG_ERROR(&Poco::Logger::get("MergeTreeData"), "Hard link fail, clone fail"); + LOG_ERROR(&Poco::Logger::get("MergeTreeData"), "Hard link fail, clone fail."); } From 5f1991fbef2f959f1d55c62194d948814d199fa9 Mon Sep 17 00:00:00 2001 From: lgbo-ustc Date: Tue, 12 Mar 2024 15:53:28 +0800 Subject: [PATCH 330/985] too big translation unit in Aggregator --- src/Common/HashTable/FixedHashMap.h | 3 + .../HashTable/TwoLevelStringHashTable.h | 1 + src/Interpreters/AggregatedData.h | 142 +++ src/Interpreters/AggregatedDataVariants.cpp | 255 ++++ src/Interpreters/AggregatedDataVariants.h | 320 +++++ src/Interpreters/AggregationMethod.cpp | 215 ++++ src/Interpreters/AggregationMethod.h | 320 +++++ src/Interpreters/Aggregator.cpp | 512 ++++---- src/Interpreters/Aggregator.h | 1035 +---------------- 9 files changed, 1541 insertions(+), 1262 deletions(-) create mode 100644 src/Interpreters/AggregatedData.h create mode 100644 src/Interpreters/AggregatedDataVariants.cpp create mode 100644 src/Interpreters/AggregatedDataVariants.h create mode 100644 src/Interpreters/AggregationMethod.cpp create mode 100644 src/Interpreters/AggregationMethod.h diff --git a/src/Common/HashTable/FixedHashMap.h b/src/Common/HashTable/FixedHashMap.h index e835a6fba94..537f37a9e6c 100644 --- a/src/Common/HashTable/FixedHashMap.h +++ b/src/Common/HashTable/FixedHashMap.h @@ -109,6 +109,9 @@ public: using Base::Base; + FixedHashMap() = default; + FixedHashMap(size_t ) {} /// NOLINT + template void ALWAYS_INLINE mergeToViaEmplace(Self & that, Func && func) { diff --git a/src/Common/HashTable/TwoLevelStringHashTable.h b/src/Common/HashTable/TwoLevelStringHashTable.h index 54c208c5b60..1ce6b3d02e3 100644 --- a/src/Common/HashTable/TwoLevelStringHashTable.h +++ b/src/Common/HashTable/TwoLevelStringHashTable.h @@ -38,6 +38,7 @@ public: Impl impls[NUM_BUCKETS]; TwoLevelStringHashTable() = default; + TwoLevelStringHashTable(size_t ) {} /// NOLINT template explicit TwoLevelStringHashTable(const Source & src) diff --git a/src/Interpreters/AggregatedData.h b/src/Interpreters/AggregatedData.h new file mode 100644 index 00000000000..6cd6b190801 --- /dev/null +++ b/src/Interpreters/AggregatedData.h @@ -0,0 +1,142 @@ +#pragma once +#include + 
+#include +#include +#include +#include +namespace DB +{ +/** Different data structures that can be used for aggregation + * For efficiency, the aggregation data itself is put into the pool. + * Data and pool ownership (states of aggregate functions) + * is acquired later - in `convertToBlocks` function, by the ColumnAggregateFunction object. + * + * Most data structures exist in two versions: normal and two-level (TwoLevel). + * A two-level hash table works a little slower with a small number of different keys, + * but with a large number of different keys scales better, because it allows + * parallelize some operations (merging, post-processing) in a natural way. + * + * To ensure efficient work over a wide range of conditions, + * first single-level hash tables are used, + * and when the number of different keys is large enough, + * they are converted to two-level ones. + * + * PS. There are many different approaches to the effective implementation of parallel and distributed aggregation, + * best suited for different cases, and this approach is just one of them, chosen for a combination of reasons. + */ + +using AggregatedDataWithoutKey = AggregateDataPtr; + +using AggregatedDataWithUInt8Key = FixedImplicitZeroHashMapWithCalculatedSize; +using AggregatedDataWithUInt16Key = FixedImplicitZeroHashMap; + +using AggregatedDataWithUInt32Key = HashMap>; +using AggregatedDataWithUInt64Key = HashMap>; + +using AggregatedDataWithShortStringKey = StringHashMap; + +using AggregatedDataWithStringKey = HashMapWithSavedHash; + +using AggregatedDataWithKeys128 = HashMap; +using AggregatedDataWithKeys256 = HashMap; + +using AggregatedDataWithUInt32KeyTwoLevel = TwoLevelHashMap>; +using AggregatedDataWithUInt64KeyTwoLevel = TwoLevelHashMap>; + +using AggregatedDataWithShortStringKeyTwoLevel = TwoLevelStringHashMap; + +using AggregatedDataWithStringKeyTwoLevel = TwoLevelHashMapWithSavedHash; + +using AggregatedDataWithKeys128TwoLevel = TwoLevelHashMap; +using AggregatedDataWithKeys256TwoLevel = TwoLevelHashMap; + +/** Variants with better hash function, using more than 32 bits for hash. + * Using for merging phase of external aggregation, where number of keys may be far greater than 4 billion, + * but we keep in memory and merge only sub-partition of them simultaneously. + * TODO We need to switch for better hash function not only for external aggregation, + * but also for huge aggregation results on machines with terabytes of RAM. + */ + +using AggregatedDataWithUInt64KeyHash64 = HashMap>; +using AggregatedDataWithStringKeyHash64 = HashMapWithSavedHash; +using AggregatedDataWithKeys128Hash64 = HashMap; +using AggregatedDataWithKeys256Hash64 = HashMap; + +template +struct AggregationDataWithNullKey : public Base +{ + using Base::Base; + + bool & hasNullKeyData() { return has_null_key_data; } + AggregateDataPtr & getNullKeyData() { return null_key_data; } + bool hasNullKeyData() const { return has_null_key_data; } + const AggregateDataPtr & getNullKeyData() const { return null_key_data; } + size_t size() const { return Base::size() + (has_null_key_data ? 
1 : 0); } + bool empty() const { return Base::empty() && !has_null_key_data; } + void clear() + { + Base::clear(); + has_null_key_data = false; + } + void clearAndShrink() + { + Base::clearAndShrink(); + has_null_key_data = false; + } + +private: + bool has_null_key_data = false; + AggregateDataPtr null_key_data = nullptr; +}; + +template +struct AggregationDataWithNullKeyTwoLevel : public Base +{ + using Base::Base; + using Base::impls; + + AggregationDataWithNullKeyTwoLevel() = default; + + template + explicit AggregationDataWithNullKeyTwoLevel(const Other & other) : Base(other) + { + impls[0].hasNullKeyData() = other.hasNullKeyData(); + impls[0].getNullKeyData() = other.getNullKeyData(); + } + + bool & hasNullKeyData() { return impls[0].hasNullKeyData(); } + AggregateDataPtr & getNullKeyData() { return impls[0].getNullKeyData(); } + bool hasNullKeyData() const { return impls[0].hasNullKeyData(); } + const AggregateDataPtr & getNullKeyData() const { return impls[0].getNullKeyData(); } +}; + +template +using HashTableWithNullKey = AggregationDataWithNullKey>; +template +using StringHashTableWithNullKey = AggregationDataWithNullKey>; + +using AggregatedDataWithNullableUInt8Key = AggregationDataWithNullKey; +using AggregatedDataWithNullableUInt16Key = AggregationDataWithNullKey; +using AggregatedDataWithNullableUInt32Key = AggregationDataWithNullKey; + + +using AggregatedDataWithNullableUInt64Key = AggregationDataWithNullKey; +using AggregatedDataWithNullableStringKey = AggregationDataWithNullKey; +using AggregatedDataWithNullableShortStringKey = AggregationDataWithNullKey; + + +using AggregatedDataWithNullableUInt32KeyTwoLevel = AggregationDataWithNullKeyTwoLevel< + TwoLevelHashMap, + TwoLevelHashTableGrower<>, HashTableAllocator, HashTableWithNullKey>>; +using AggregatedDataWithNullableUInt64KeyTwoLevel = AggregationDataWithNullKeyTwoLevel< + TwoLevelHashMap, + TwoLevelHashTableGrower<>, HashTableAllocator, HashTableWithNullKey>>; + +using AggregatedDataWithNullableShortStringKeyTwoLevel = AggregationDataWithNullKeyTwoLevel< + TwoLevelStringHashMap>; + +using AggregatedDataWithNullableStringKeyTwoLevel = AggregationDataWithNullKeyTwoLevel< + TwoLevelHashMapWithSavedHash, + TwoLevelHashTableGrower<>, HashTableAllocator, HashTableWithNullKey>>; +} diff --git a/src/Interpreters/AggregatedDataVariants.cpp b/src/Interpreters/AggregatedDataVariants.cpp new file mode 100644 index 00000000000..0c86c58bd3e --- /dev/null +++ b/src/Interpreters/AggregatedDataVariants.cpp @@ -0,0 +1,255 @@ +#include +#include + +namespace ProfileEvents +{ + extern const Event AggregationPreallocatedElementsInHashTables; +} + +namespace DB +{ +namespace ErrorCodes +{ + extern const int UNKNOWN_AGGREGATED_DATA_VARIANT; + extern const int LOGICAL_ERROR; + +} +using ColumnsHashing::HashMethodContext; +using ColumnsHashing::HashMethodContextPtr; +using ColumnsHashing::LastElementCacheStats; + +AggregatedDataVariants::AggregatedDataVariants() : aggregates_pools(1, std::make_shared()), aggregates_pool(aggregates_pools.back().get()) {} + +AggregatedDataVariants::~AggregatedDataVariants() +{ + if (aggregator && !aggregator->all_aggregates_has_trivial_destructor) + { + try + { + aggregator->destroyAllAggregateStates(*this); + } + catch (...) + { + tryLogCurrentException(__PRETTY_FUNCTION__); + } + } +} + +// The std::is_constructible trait isn't suitable here because some classes have template constructors with semantics different from providing size hints. 
+// Also string hash table variants are not supported due to the fact that both local perf tests and tests in CI showed slowdowns for them. +template +struct HasConstructorOfNumberOfElements : std::false_type +{ +}; + +template +struct HasConstructorOfNumberOfElements> : std::true_type +{ +}; + +template typename ImplTable> +struct HasConstructorOfNumberOfElements> : std::true_type +{ +}; + +template +struct HasConstructorOfNumberOfElements> : std::true_type +{ +}; + +template +struct HasConstructorOfNumberOfElements> : std::true_type +{ +}; + +template